aboutsummaryrefslogtreecommitdiff
path: root/cvmx-log-arc.S
blob: bfb068e30d9eead502835d39514efbb55747042f (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
/***********************license start***************
 * Copyright (c) 2003-2010  Cavium Inc. (support@cavium.com). All rights 
 * reserved.
 *
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are
 * met:
 *
 *   * Redistributions of source code must retain the above copyright
 *     notice, this list of conditions and the following disclaimer.
 *
 *   * Redistributions in binary form must reproduce the above
 *     copyright notice, this list of conditions and the following
 *     disclaimer in the documentation and/or other materials provided
 *     with the distribution.

 *   * Neither the name of Cavium Inc. nor the names of
 *     its contributors may be used to endorse or promote products
 *     derived from this software without specific prior written
 *     permission.  

 * This Software, including technical data, may be subject to U.S. export  control
 * laws, including the U.S. Export Administration Act and its  associated
 * regulations, and may be subject to export or import  regulations in other
 * countries. 

 * TO THE MAXIMUM EXTENT PERMITTED BY LAW, THE SOFTWARE IS PROVIDED "AS IS" 
 * AND WITH ALL FAULTS AND CAVIUM INC. MAKES NO PROMISES, REPRESENTATIONS OR
 * WARRANTIES, EITHER EXPRESS, IMPLIED, STATUTORY, OR OTHERWISE, WITH RESPECT TO
 * THE SOFTWARE, INCLUDING ITS CONDITION, ITS CONFORMITY TO ANY REPRESENTATION OR
 * DESCRIPTION, OR THE EXISTENCE OF ANY LATENT OR PATENT DEFECTS, AND CAVIUM
 * SPECIFICALLY DISCLAIMS ALL IMPLIED (IF ANY) WARRANTIES OF TITLE,
 * MERCHANTABILITY, NONINFRINGEMENT, FITNESS FOR A PARTICULAR PURPOSE, LACK OF
 * VIRUSES, ACCURACY OR COMPLETENESS, QUIET ENJOYMENT, QUIET POSSESSION OR
 * CORRESPONDENCE TO DESCRIPTION. THE ENTIRE  RISK ARISING OUT OF USE OR
 * PERFORMANCE OF THE SOFTWARE LIES WITH YOU.
 ***********************license end**************************************/







//
// The function defined here is called on entry to every instrumented
// function. The calls are inserted automatically by GCC when the "-pg"
// option is used. This allows cvmx-log to add a PC entry as each function
// is executed. This information, along with the timestamps, can give the
// user a good idea of the performance characteristics of their program.
// This function normally takes about 22 cycles to execute.
//

#ifdef __linux__
#include <asm/asm.h>
#include <asm/regdef.h>
#define LA dla
#else
#include <machine/asm.h>
#include <machine/regdef.h>
#define LA la
#endif

.set noreorder
.set noat
//
// Size of the slow-path register save area. 27 registers * 8 bytes = 216
// bytes are actually stored (offsets 0..208); the size is rounded up to 224
// so that sp stays 16-byte aligned while the C function cvmx_log_pc runs.
//
#define MCOUNT_SLOW_FRAME	224

//
// _mcount - profiling hook that appends a PC record to the cvmx-log buffer.
//
// In:    ra = address inside the instrumented function (logged as the PC)
//        $1 (at) = the instrumented function's original ra
// Out:   none; every general purpose register is returned with the value
//        it had before the call, ra is reloaded from $1, and 32 bytes are
//        popped from the stack.
// Fast path: writes a 16 byte record (header, pc) at the write pointer
//        and advances the pointer by 16.
// Slow path: fewer than 16 bytes remain, so cvmx_log_pc(ra) is called.
//
LEAF(_mcount)
	//
	// All registers we use must be saved since calls are added by gcc
	// after register allocation. The at register ($1) will contain the
	// original ra register before the _mcount call. In the non-Linux
	// build the compiler automatically performs a "dsubu sp, sp, 16"
	// before we're called, so only 16 more bytes are allocated here; in
	// the __linux__ build all 32 bytes are allocated here (presumably
	// the compiler does not pre-adjust sp there - confirm against the
	// toolchain). At the end of this function all registers must have
	// their original values and the stack pointer is adjusted by 32.
	// This code is pretty unreadable since it has been arranged to
	// promote dual issue; do not reorder instructions casually.
	//
	// Frame layout after the adjustment below:
	//   0(sp)=s0  8(sp)=s1  16(sp)=s2  24(sp)=s3
	//
#ifdef __linux__
	dsubu	sp, sp, 32
#else
	dsubu	sp, sp, 16
#endif
	sd	s3, 24(sp)				// Save register
	rdhwr	s3, $31					// Read the cycle count
	sd	s0, 0(sp)				// Save register
	LA	s0, cvmx_log_buffer_end_ptr		// Load the address of the end of the log buffer
	sd	s1, 8(sp)				// Save register
	LA	s1, cvmx_log_buffer_write_ptr		// Load the address of the location in the log buffer
	sd	s2, 16(sp)				// Save register
	ld	s0, 0(s0)				// Get value of the current log buffer end location
	ld	s2, 0(s1)				// Get value of the current log buffer location
	dsubu	s0, s0, s2				// s0 = end pointer - write pointer = bytes remaining
	sltiu	s0, s0, 16				// s0 = 1 if fewer than 16 bytes remain (unsigned compare)
	bne	s0, $0, call_c_pc			// Call the slow C function if we don't have room in the log
	li	s0, 0x001				// (delay slot, runs on both paths) 11 bit constant that matches the first 11 bits of a CVMX_LOG_TYPE_PC header
	sd	ra, 8(s2)				// Write the pc to the log
	dins	s3, s0, 53, 11				// Overwrite the upper cycle count bits with the CVMX_LOG_TYPE_PC header
	sd	s3, 0(s2)				// Write the log header
	daddu	s2, s2, 16				// Increment the write location ptr
	sd	s2, 0(s1)				// Store the write location ptr
return_c_pc:
	ld	s0, 0(sp)				// Restore register
	ld	s1, 8(sp)				// Restore register
	ld	s2, 16(sp)				// Restore register
	ld	s3, 24(sp)				// Restore register
	daddu	sp, sp, 32				// Pop everything off the stack, even the 16 bytes done by gcc
	jr	ra					// Return to the caller and
	or	ra, $1, $1				// (delay slot) make sure the ra is back to its original value

call_c_pc:
	// The registers used by the C code may change based on optimizations. To be
	// safe, I'll save all registers. We're in the slow path case anyway.
	// The frame is MCOUNT_SLOW_FRAME bytes rather than the 216 bytes that are
	// stored so that sp is still a multiple of 16 when cvmx_log_pc is entered;
	// the last 8 bytes of the frame are unused padding.
	dsubu	sp, sp, MCOUNT_SLOW_FRAME
	sd	$1, 0(sp)
	sd	$2, 8(sp)
	sd	$3, 16(sp)
	sd 	$4, 24(sp)
	sd 	$5, 32(sp)
	sd	$6, 40(sp)
	sd	$7, 48(sp)
	sd	$8, 56(sp)
	sd	$9, 64(sp)
	sd	$10, 72(sp)
	sd	$11, 80(sp)
	sd	$12, 88(sp)
	sd	$13, 96(sp)
	sd	$14, 104(sp)
	sd	$15, 112(sp)
	// s0, s1, s2, s3 are already saved
	sd	$20, 120(sp)
	sd	$21, 128(sp)
	sd	$22, 136(sp)
	sd	$23, 144(sp)
	sd	$24, 152(sp)
	sd	$25, 160(sp)
	sd	$26, 168(sp)
	sd	$27, 176(sp)
	sd	$28, 184(sp)
	sd	$29, 192(sp)				// sp as it is after the frame adjustment above
	sd	$30, 200(sp)
	sd	$31, 208(sp)

	or	a0, ra, ra				// First argument = the pc to log
	jal	cvmx_log_pc
	nop						// (delay slot)

	ld	$1, 0(sp)
	ld	$2, 8(sp)
	ld	$3, 16(sp)
	ld 	$4, 24(sp)
	ld 	$5, 32(sp)
	ld	$6, 40(sp)
	ld	$7, 48(sp)
	ld	$8, 56(sp)
	ld	$9, 64(sp)
	ld	$10, 72(sp)
	ld	$11, 80(sp)
	ld	$12, 88(sp)
	ld	$13, 96(sp)
	ld	$14, 104(sp)
	ld	$15, 112(sp)
	// s0, s1, s2, s3 will be restored later
	ld	$20, 120(sp)
	ld	$21, 128(sp)
	ld	$22, 136(sp)
	ld	$23, 144(sp)
	ld	$24, 152(sp)
	ld	$25, 160(sp)
	ld	$26, 168(sp)
	ld	$27, 176(sp)
	ld	$28, 184(sp)
	ld	$29, 192(sp)
	ld	$30, 200(sp)
	ld	$31, 208(sp)
	b	return_c_pc				// Rejoin the common epilogue
	daddu	sp, sp, MCOUNT_SLOW_FRAME		// (delay slot) release the slow-path frame

END(_mcount)