blob: 34a388904e38436ff0246a106461f34fa6299065 [file] [log] [blame]
Sundarajan Srinivasan1b03fe22014-12-02 13:20:56 -08001/*
2 **************************************************************************
3 * Copyright (c) 2014, The Linux Foundation. All rights reserved.
4 * Permission to use, copy, modify, and/or distribute this software for
5 * any purpose with or without fee is hereby granted, provided that the
6 * above copyright notice and this permission notice appear in all copies.
7 * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
8 * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
9 * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
10 * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
11 * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
12 * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT
13 * OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
14 **************************************************************************
15 */
16
17/*
18 * profilenode.h
19 * device node for the profiler, to communicate with the linux driver
20 *
21 * WANRING:
22 * This file must present in both nss/source/pkg/profile/include for NSS driver,
23 * and linux-nbu/driver/.../nss for Linux driver
24 */
25
26#include "profilesample.h"
27
28#define UBI32_PROFILE_HD_MAGIC 0x4F525000 // 0 + "PRO"
29#define UBI32_PROFILE_HD_MAGIC_REV 0x0050524F // different endian
30#define UBI32_PROFILE_HD_MMASK 0xFFFFFF00 // 1st byte is Rx/Tx cmd
31#define UBI32_PROFILE_HD_MMASK_REV 0x00FFFFFF
32
33enum profile_cmds {
34 // cmds from HLOS to NSS
35 PROFILER_CHANGE_SAMPLING_RATE, // change sampling clock timer
36 PROFILER_START, // start/stop sampling engine
37 PROFILER_STOP,
38 PROFILER_FLOWCTRL, // info how many buffers available
39 DEBUG_RD_REQ, // I/O commands h2n
40 DEBUG_WR_REQ,
41 DEBUG_REPLY, // n2h respond
42
43 // data from NSS to HLOS
44 PROFILER_FIXED_INFO = 8, // set bit 3 for data
45 PROFILER_COUNTERS,
46 PROFILER_SAMPLES,
47};
48
49struct profile_sample_ctrl_header {
50 uint32_t hd_magic; // cmd + MAGIC for packet and endianess check
51
52 /*
53 * controlling data need to be sent to and used by upper layer (HLOS)
54 */
55 uint16_t count; // number of valid samples
56 uint16_t max_samples; // how many samples can be in the samples array
57 uint32_t dropped_samples; // how many samples did the profiler drop due to buffer overruns
58
59 /*
60 * info data -- sent to remote profiler tool (need swap)
61 */
62 struct profile_ext_header exh;
63
64};
65
66/*
67 * # of sample buffers in pbuf payload
68 */
69#ifndef PBUF_PAYLOAD_SIZE
70#define PBUF_PAYLOAD_SIZE 1792 // for HLOS driver: must sync with pbuf_public
71typedef enum meta_types {
72 PINGPONG_EMPTY,
73 PINGPONG_FULL,
74 PINGPONG_INUSE,
75} flowctrl_t;
76#else
77typedef enum pnode_c2h_metadata_types flowctrl_t; // for NSS driver
78#endif
79
80#define MAX_SAMPLES_PER_PBUF ((PBUF_PAYLOAD_SIZE - sizeof(struct profile_sample_ctrl_header)) / sizeof(struct profile_sample))
81
82struct n2h_meta_header {
83 flowctrl_t md_type; // N2H (NSS) and receiver (HLOS) flow control (meta type)
84 uint32_t d_len; // total data length start from psc_header
85};
86
87struct profile_session { // use for per session start
88 uint32_t hd_magic; // common ovarlay in all headers
Guojun Jin3deae8c2016-08-23 15:51:21 -070089 uint8_t num_counters; /* # performance (app) counters registered (changeable) */
90 uint8_t unused1B;
91 uint8_t nc_sts_sel_thrA;
92 uint8_t nc_sts_sel_thrB;
Sundarajan Srinivasan1b03fe22014-12-02 13:20:56 -080093 uint32_t ocm_size;
94 uint32_t sram_start;
95
96 uint32_t rate; // sampling rate
97 uint32_t cpu_id; // chip_id register
98 uint32_t cpu_freq; // chip clock
99 uint32_t ddr_freq; // DDR MEM speed
100 struct profile_counter counters[PROFILE_MAX_APP_COUNTERS];
101};
102
103struct profile_n2h_sample_buf {
104 struct n2h_meta_header mh;
105
106 struct profile_sample_ctrl_header psc_header; // per sample period
107 struct profile_sample samples[MAX_SAMPLES_PER_PBUF]; // per thread samples - for NSS send
108};
109
110struct profile_common {
111 struct profile_session un;
112 /*
113 * changable data sent everything pbuf
114 */
115 struct profile_n2h_sample_buf *pn2h; // sampling ctrl for this sample period
116 struct profile_sample *samples; // samples array was allocated by the linux driver
117 // now NSS points it to pbuf + pn2h header
118 uint16_t cur; // pos where driver take (read) samples
119 int16_t enabled; // Is the profiler enabled to take samples?
120};
121
122/*
123 * each buffer holds 4-7 sets (sample intrs) of samples; by average 5 sets per buffer,
124 * at 10ms smaple clock, 1s sleep in profilerd requires kernel to have 1000 / 10 / 5 = 20
125 * buffer to store one 1s samples. For higher sampling rate, either kernel needs more buffers
126 * or profilerd needs less sleep time, but both needs to make match.
127 */
128#define CCL_SIZE 32
129
130struct profile_io {
131 struct profile_common pnc;
132
133 /*
134 * control fields - HLOS
135 */
136 void *ctx; // nss_ctx for Linux driver
137 int profile_first_packet;
138 int profile_sequence_num;
139
140 /*
141 * circular buffers for psc_header/samples
142 */
143 struct profile_n2h_sample_buf *ccl;
144 int ccl_read;
145 int ccl_write;
146
147 /*
148 * data from HLOS -- used to generate sample->pid in ULTRA -- no longer needed in NSS
149 */
150 uint32_t *sw_ksp_ptr; // pointer to array (per hardware thread) of pointers to struct thread_info
151 uint32_t task_offset; // offset in bytes in thread_info to task_struct pointer
152 uint32_t pid_offset; // offset in bytes in task_struct to the PID
153};
154
155/*
156 * Krait <--> NSS debug mechanism. It lays over on profile_n2h_sample_buf.samples (ccl->samples)
157 */
158#define MAX_DB_WR 28 // profile_session has 31 4B words data (32W total with hd_magic) and
159#define MAX_DB_RD 30 // common has two more ptrs
160struct debug_box { // this overlays with profile_common (RD) or profile_session (WR)
161 uint32_t hd_magic; // cmd + MAGIC for packet and endianess check
162
163 uint32_t opts;
164 uint32_t *base_addr;
165 int32_t dlen; // in 4B words
166 uint32_t data[MAX_DB_RD];
167};
168
169#define DEBUG_OPT_BCTRL 1 // basic CTRL
170#define DEBUG_OPT_MOVEIO (1<<1) // force to use moveio in case new OCP range is added