1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
|
/***********************license start***************
* Copyright (c) 2003-2010 Cavium Inc. (support@cavium.com). All rights
* reserved.
*
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions are
* met:
*
* * Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
*
* * Redistributions in binary form must reproduce the above
* copyright notice, this list of conditions and the following
* disclaimer in the documentation and/or other materials provided
* with the distribution.
* * Neither the name of Cavium Inc. nor the names of
* its contributors may be used to endorse or promote products
* derived from this software without specific prior written
* permission.
* This Software, including technical data, may be subject to U.S. export control
* laws, including the U.S. Export Administration Act and its associated
* regulations, and may be subject to export or import regulations in other
* countries.
* TO THE MAXIMUM EXTENT PERMITTED BY LAW, THE SOFTWARE IS PROVIDED "AS IS"
* AND WITH ALL FAULTS AND CAVIUM INC. MAKES NO PROMISES, REPRESENTATIONS OR
* WARRANTIES, EITHER EXPRESS, IMPLIED, STATUTORY, OR OTHERWISE, WITH RESPECT TO
* THE SOFTWARE, INCLUDING ITS CONDITION, ITS CONFORMITY TO ANY REPRESENTATION OR
* DESCRIPTION, OR THE EXISTENCE OF ANY LATENT OR PATENT DEFECTS, AND CAVIUM
* SPECIFICALLY DISCLAIMS ALL IMPLIED (IF ANY) WARRANTIES OF TITLE,
* MERCHANTABILITY, NONINFRINGEMENT, FITNESS FOR A PARTICULAR PURPOSE, LACK OF
* VIRUSES, ACCURACY OR COMPLETENESS, QUIET ENJOYMENT, QUIET POSSESSION OR
* CORRESPONDENCE TO DESCRIPTION. THE ENTIRE RISK ARISING OUT OF USE OR
* PERFORMANCE OF THE SOFTWARE LIES WITH YOU.
***********************license end**************************************/
//
// The function defined here is called for every function as it is executed.
// These calls are automatically inserted by GCC when the switch "-pg" is
// used. This allows cvmx-log to add a PC entry as each function is executed.
// This information, along with the timestamps, can give the user a good idea
// of the performance characteristics of their program. This function normally
// takes about 22 cycles to execute.
//
#ifdef __linux__
#include <asm/asm.h>
#include <asm/regdef.h>
#define LA dla
#else
#include <machine/asm.h>
#include <machine/regdef.h>
#define LA la
#endif
.set noreorder
.set noat
LEAF(_mcount)
//
// _mcount - profiling hook that appends a PC record to the cvmx-log buffer.
//
// On entry:
//   ra  = return address inside the function being profiled (logged as the PC)
//   $1  = (at) the profiled function's own original ra, restored into ra on exit
//
// All registers we use must be saved since calls are added by gcc
// after register allocation. The at register ($1) will contain the
// original ra register before the _mcount call. Also the compiler
// automatically performs a "dsubu sp, sp, 16" before we're called.
// At the end of this function all registers must have their original
// values and the stack pointer must be adjusted by 16. This code is
// pretty unreadable since it has been arranged to promote dual issue.
//
// Fast path: if at least 16 bytes remain between cvmx_log_buffer_write_ptr
// and cvmx_log_buffer_end_ptr, a 16 byte record {header|cycle, pc} is written
// in place and the write pointer is advanced by 16.
// Slow path: otherwise cvmx_log_pc(ra) is called with every other register
// preserved around the call.
//
// The file is assembled with ".set noreorder", so the instruction following
// each branch/jump is its delay slot and always executes.
//

// Slow path frame: 27 registers * 8 bytes = 216 bytes of save area, rounded
// up to 224 so that sp remains a multiple of 16 across the call into C
// (assuming sp was 16 byte aligned before the slow path was entered).
#define CVMX_MCOUNT_SLOW_FRAME 224

#ifdef __linux__
    dsubu   sp, sp, 32
#else
    dsubu   sp, sp, 16
#endif
    sd      s3, 24(sp)                      // Save register
    rdhwr   s3, $31                         // Read the cycle count
    sd      s0, 0(sp)                       // Save register
    LA      s0, cvmx_log_buffer_end_ptr     // Load the address of the end of the log buffer
    sd      s1, 8(sp)                       // Save register
    LA      s1, cvmx_log_buffer_write_ptr   // Load the address of the location in the log buffer
    sd      s2, 16(sp)                      // Save register
    ld      s0, 0(s0)                       // Get value of the current log buffer end location
    ld      s2, 0(s1)                       // Get value of the current log buffer location
    dsubu   s0, s0, s2                      // Subtract the end pointer and the write pointer
    sltiu   s0, s0, 16                      // s0 = 1 if fewer than 16 bytes remain
    bne     s0, $0, call_c_pc               // Call the slow C function if we don't have room in the log
     li     s0, 0x001                       // (delay slot) 11 bit constant that matches the first 11 bits of a CVMX_LOG_TYPE_PC header
    sd      ra, 8(s2)                       // Write the pc to the log
    dins    s3, s0, 53, 11                  // Overwrite the upper cycle count bits with the CVMX_LOG_TYPE_PC header
    sd      s3, 0(s2)                       // Write the log header
    daddu   s2, s2, 16                      // Increment the write location ptr
    sd      s2, 0(s1)                       // Store the write location ptr

return_c_pc:
    ld      s0, 0(sp)                       // Restore register
    ld      s1, 8(sp)                       // Restore register
    ld      s2, 16(sp)                      // Restore register
    ld      s3, 24(sp)                      // Restore register
    // Pop everything off the stack, even the 16 bytes done by gcc.
    // NOTE(review): on the __linux__ path 32 bytes were allocated above, so
    // this only balances our own allocation there - confirm that gcc does not
    // adjust sp before calling _mcount on that target.
    daddu   sp, sp, 32
    jr      ra                              // Return to the caller and
     or     ra, $1, $1                      // (delay slot) make sure the ra is back to its original value

call_c_pc:
    // The registers used by the C code may change based on optimizations. To be
    // safe, I'll save all registers. We're in the slow path case anyway.
    dsubu   sp, sp, CVMX_MCOUNT_SLOW_FRAME
    sd      $1, 0(sp)
    sd      $2, 8(sp)
    sd      $3, 16(sp)
    sd      $4, 24(sp)
    sd      $5, 32(sp)
    sd      $6, 40(sp)
    sd      $7, 48(sp)
    sd      $8, 56(sp)
    sd      $9, 64(sp)
    sd      $10, 72(sp)
    sd      $11, 80(sp)
    sd      $12, 88(sp)
    sd      $13, 96(sp)
    sd      $14, 104(sp)
    sd      $15, 112(sp)
    // s0, s1, s2, s3 are already saved
    sd      $20, 120(sp)
    sd      $21, 128(sp)
    sd      $22, 136(sp)
    sd      $23, 144(sp)
    sd      $24, 152(sp)
    sd      $25, 160(sp)
    sd      $26, 168(sp)
    sd      $27, 176(sp)
    sd      $28, 184(sp)
    sd      $29, 192(sp)
    sd      $30, 200(sp)
    sd      $31, 208(sp)                    // ra is clobbered by the jal below
    // Offsets 216..223 are alignment padding and are never accessed.
    or      a0, ra, ra                      // First C argument = pc to log
    jal     cvmx_log_pc
     nop                                    // (delay slot)
    ld      $1, 0(sp)
    ld      $2, 8(sp)
    ld      $3, 16(sp)
    ld      $4, 24(sp)
    ld      $5, 32(sp)
    ld      $6, 40(sp)
    ld      $7, 48(sp)
    ld      $8, 56(sp)
    ld      $9, 64(sp)
    ld      $10, 72(sp)
    ld      $11, 80(sp)
    ld      $12, 88(sp)
    ld      $13, 96(sp)
    ld      $14, 104(sp)
    ld      $15, 112(sp)
    // s0, s1, s2, s3 will be restored later
    ld      $20, 120(sp)
    ld      $21, 128(sp)
    ld      $22, 136(sp)
    ld      $23, 144(sp)
    ld      $24, 152(sp)
    ld      $25, 160(sp)
    ld      $26, 168(sp)
    ld      $27, 176(sp)
    ld      $28, 184(sp)
    ld      $29, 192(sp)                    // Reloads the sp value stored above (sp after the frame allocation)
    ld      $30, 200(sp)
    ld      $31, 208(sp)
    b       return_c_pc
     daddu  sp, sp, CVMX_MCOUNT_SLOW_FRAME  // (delay slot) release the slow path frame
END(_mcount)
|