xref: /linux-tools/perf/profiler/profiler.cpp (revision 4092c028975ca3f60c7b40101bb2099527aa80e7)
178c68143SDavid Wang #include <stdlib.h>
278c68143SDavid Wang #include <stdio.h>
378c68143SDavid Wang #include <unistd.h>
478c68143SDavid Wang #include <string.h>
578c68143SDavid Wang #include <sys/ioctl.h>
678c68143SDavid Wang #include <linux/perf_event.h>
778c68143SDavid Wang #include <asm/unistd.h>
878c68143SDavid Wang #include <sys/mman.h>
978c68143SDavid Wang #include <sys/stat.h>
1078c68143SDavid Wang #include <poll.h>
1178c68143SDavid Wang #include <signal.h>
1278c68143SDavid Wang #include <fcntl.h>
1378c68143SDavid Wang #include <elf.h>
1478c68143SDavid Wang #include <string.h>
1578c68143SDavid Wang 
1678c68143SDavid Wang #include <vector>
1778c68143SDavid Wang #include <string>
1878c68143SDavid Wang #include <map>
1978c68143SDavid Wang #include <unordered_map>
2078c68143SDavid Wang #include <algorithm>
2178c68143SDavid Wang using namespace std;
2278c68143SDavid Wang 
2378c68143SDavid Wang 
// Number of ring-buffer data pages mapped per perf fd; the mmap length used
// in this file is (1+MAXN) pages.
#define MAXN 128
// Capacity of the pollfd table, i.e. the largest number of CPUs attached.
#define MAXCPU 1024
// Report `msg` together with the current errno text, then terminate with
// exit status 1.
#define error(msg)   \
    do {             \
        perror(msg); \
        exit(1);     \
    } while (0)
2778c68143SDavid Wang //--------------------------------Tree for call chain and report-------------------------------
2878c68143SDavid Wang //
/*
 * One node of the call-chain tree used to build the HTML report.
 *
 *   c - number of times add() was called on this node.
 *   s - children keyed by function name.
 *
 * Child nodes are allocated with new and never released by this type.
 */
struct TNode {
    int c=0;
    std::unordered_map<std::string, TNode*> s;

    /*
     * Count one more call on this node and return the child named `n`,
     * creating it on first use.
     */
    struct TNode *add(std::string n) {
        c++;
        // single lookup: operator[] value-initialises a missing slot to nullptr
        TNode*& slot = s[n];
        if (slot == nullptr) slot = new TNode();
        return slot;
    }

    /* Escape the characters that are significant in HTML text and attributes. */
    static std::string html_escape(const std::string& text) {
        std::string out;
        out.reserve(text.size());
        for (char ch : text) {
            switch (ch) {
                case '&': out += "&amp;"; break;
                case '<': out += "&lt;"; break;
                case '>': out += "&gt;"; break;
                case '"': out += "&quot;"; break;
                default: out += ch; break;
            }
        }
        return out;
    }

    /*
     * Write the children of this node to `fp` as nested <li> items, largest
     * count first (ties: name descending). Children below 1% of this node's
     * count are omitted. `k` is the next free checkbox id; the next free id
     * after this subtree is returned.
     */
    int printit(FILE *fp, int k) {
        if (s.empty()) return k;

        // Sort pointers to the map entries instead of copying name strings.
        using Entry = const std::pair<const std::string, TNode*>*;
        std::vector<Entry> order;
        order.reserve(s.size());
        for (const auto& kv : s) order.push_back(&kv);
        std::sort(order.begin(), order.end(), [](Entry a, Entry b) {
            if (a->second->c != b->second->c) return a->second->c > b->second->c;
            return a->first > b->first;
        });

        for (Entry e : order) {
            const int count = e->second->c;
            const double percent = 100.0*count/c;
            if (percent<1) continue;
            // names come from symbol tables of arbitrary binaries: escape them
            const std::string label = html_escape(e->first);
            fprintf(fp, "<li>\n");
            fprintf(fp, "<input type=\"checkbox\" id=\"c%d\" />\n", k);
            fprintf(fp, "<label class=\"tree_label\" for=\"c%d\">%s(%.3f%% %d/%d)</label>\n", k, label.c_str(), percent, count, c);
            fprintf(fp, "<ul>\n");
            k = e->second->printit(fp, k+1);
            fprintf(fp, "</ul>\n");
            fprintf(fp, "</li>\n");
        }
        return k;
    }
};
6178c68143SDavid Wang 
6278c68143SDavid Wang //--------------------------------symbols-------------------------------------------
// User-space symbols: runtime start address -> (function name, size in bytes).
using STORE_T = std::map<unsigned long long, std::pair<std::string, unsigned long long>>;
// Kernel symbols: start address -> function name.
using K_STORE_T = std::map<unsigned long long, std::string>;

/*
 * Load FUNC symbols from a 64-bit ELF file and relocate them to the address
 * at which the file is mapped.
 *
 *   fp       - ELF file, positioned at its first byte.
 *   v_addr   - start address of the mapping in the target process.
 *   v_size   - length of the mapping (currently unused).
 *   v_offset - file offset of the mapping; the executable program header
 *              whose p_offset equals it supplies the link-time base address.
 *   store    - receives runtime address -> (name, size).
 *
 * Nothing is stored if the header cannot be read or no executable program
 * header matches v_offset. Malformed symbol tables (entry size smaller than
 * Elf64_Sym, string-table link out of range) are skipped rather than trusted.
 */
void parse_elf64(FILE *fp, unsigned long long v_addr, unsigned long long v_size, unsigned long long v_offset, STORE_T& store) {
    (void)v_size;
    Elf64_Ehdr ehdr;
    if (fread(&ehdr, sizeof(ehdr), 1, fp) != 1) return;

    // find the executable segment this mapping was created from
    bool matched = false;
    unsigned long long p_vaddr = 0, p_size = 0;
    unsigned long long pos = ehdr.e_phoff;
    for (unsigned i=0; i<ehdr.e_phnum; i++, pos+=ehdr.e_phentsize) {
        Elf64_Phdr phdr;
        if (fseek(fp, pos, SEEK_SET)<0) { perror("fail to seek"); return; }
        if (fread(&phdr, sizeof(phdr), 1, fp) != 1) { perror("fail to read program header"); return; }
        if ((phdr.p_flags&PF_X) && phdr.p_offset == v_offset) {
            p_vaddr = phdr.p_vaddr;
            p_size = phdr.p_memsz ? phdr.p_memsz : 0xffffffff;
            matched = true;
            break;
        }
    }
    if (!matched) { printf("No program header match offset found, fail to load\n"); return; }

    // load section headers
    std::vector<Elf64_Shdr> headers;
    headers.reserve(ehdr.e_shnum);
    pos = ehdr.e_shoff;
    for (unsigned i=0; i<ehdr.e_shnum; i++, pos+=ehdr.e_shentsize) {
        Elf64_Shdr shdr;
        if (fseek(fp, pos, SEEK_SET)<0) { perror("fail to seek"); return; }
        if (fread(&shdr, sizeof(shdr), 1, fp) != 1) { perror("fail to read sec header"); return; }
        headers.push_back(shdr);
    }

    // walk every symbol table and keep the named, sized FUNC symbols
    char fname[128];
    for (const Elf64_Shdr& table : headers) {
        if (table.sh_type != SHT_SYMTAB && table.sh_type != SHT_DYNSYM) continue;
        const unsigned long long link = table.sh_link;
        if (link == 0 || link >= headers.size()) continue;      // no usable string table
        const unsigned long long item_size = table.sh_entsize;
        if (item_size < sizeof(Elf64_Sym)) continue;            // 0 would never advance the cursor
        const unsigned long long names_at = headers[link].sh_offset;

        for (unsigned long long k=0; k+item_size<=table.sh_size; k+=item_size) {
            Elf64_Sym symb;
            if (fseek(fp, table.sh_offset+k, SEEK_SET)<0) continue;
            if (fread(&symb, sizeof(symb), 1, fp) != 1) continue;
            if (ELF64_ST_TYPE(symb.st_info) != STT_FUNC) continue;
            if (symb.st_shndx == 0) continue;                   // undefined symbol
            if (symb.st_size == 0) continue;
            if (symb.st_value > p_vaddr+p_size) continue;       // beyond the matched segment
            if (symb.st_name == 0) continue;                    // unnamed
            if (fseek(fp, names_at+symb.st_name, SEEK_SET)<0) continue;
            // fgets may read past the terminating NUL; std::string stops at it.
            // Names longer than the buffer are truncated.
            if (fgets(fname, sizeof(fname), fp)==NULL) continue;
            const unsigned long long runtime_addr = symb.st_value-p_vaddr+v_addr;
            store[runtime_addr] = std::make_pair(std::string(fname), (unsigned long long)symb.st_size);
        }
    }
}
14678c68143SDavid Wang 
14778c68143SDavid Wang int load_symbol_from_file(const char *path, unsigned long long addr, unsigned long long size, unsigned long long offset, STORE_T& store) {
14878c68143SDavid Wang     printf("loading symble from %s\n", path);
14978c68143SDavid Wang     FILE *fp = fopen(path, "rb");
15078c68143SDavid Wang     if (fp==NULL) { perror("fail to open file"); return -1; }
15178c68143SDavid Wang     char ident[EI_NIDENT], c;
15278c68143SDavid Wang     int err=0;
15378c68143SDavid Wang     int rc = fread(ident, sizeof(ident), 1, fp);
15478c68143SDavid Wang     if (rc != 1) { perror("fail to read ident"); err=-1; goto end; }
15578c68143SDavid Wang     if (ident[0]!=0x7f) { printf("not a elf file\n"); err=-1; goto  end; }
15678c68143SDavid Wang     c=ident[4];
15778c68143SDavid Wang     rc = fseek(fp, 0, SEEK_SET); if (rc<0) { perror("fail to rewind"); goto end; }
15878c68143SDavid Wang     if (c == ELFCLASS32) {
15978c68143SDavid Wang         printf("32bit elf not supported yet\n"); err=-2; goto end;
16078c68143SDavid Wang     } else if (c == ELFCLASS64) {
16178c68143SDavid Wang         parse_elf64(fp, addr, size, offset, store);
16278c68143SDavid Wang     }
16378c68143SDavid Wang 
16478c68143SDavid Wang end:
16578c68143SDavid Wang     fclose(fp);
16678c68143SDavid Wang     return err;
16778c68143SDavid Wang }
16878c68143SDavid Wang 
/*
 * Parse a hexadecimal number at the start of `p`.
 *
 * Leading spaces and tabs are skipped and an optional "0x"/"0X" prefix is
 * accepted when a hex digit follows it. Parsing stops at the first character
 * that is not a hex digit.
 *
 *   n - receives the number of characters consumed from `p` (blanks and
 *       prefix included), or 0 when no digit was found, so callers can
 *       tell "no number here" from a parsed value of zero.
 *
 * Returns the parsed value (0 when nothing was parsed). Overflow beyond
 * 64 bits is not detected.
 */
static unsigned long long parse_hex(char *p, int *n) {
    auto hex_value = [](char ch) -> int {
        if (ch>='0'&&ch<='9') return ch-'0';
        if (ch>='a'&&ch<='f') return 10+ch-'a';
        if (ch>='A'&&ch<='F') return 10+ch-'A';
        return -1;
    };

    *n = 0;
    int i = 0;
    while (p[i]==' '||p[i]=='\t') i++;
    if (p[i]=='0' && (p[i+1]=='x'||p[i+1]=='X') && hex_value(p[i+2])>=0) i += 2;

    const int first_digit = i;
    unsigned long long r = 0;
    for (int v; (v = hex_value(p[i])) >= 0; i++) r = (r<<4)+v;

    if (i == first_digit) return 0;   // no digits: leave *n at 0
    *n = i;
    return r;
}
18878c68143SDavid Wang 
18978c68143SDavid Wang STORE_T*  load_symbol_pid(int pid) {
19078c68143SDavid Wang     printf("loading symbols for %d\n", pid);
19178c68143SDavid Wang     char bb[128];
19278c68143SDavid Wang     sprintf(bb, "/proc/%d/maps", pid);
19378c68143SDavid Wang     FILE* fp = fopen(bb, "r");
19478c68143SDavid Wang     if (fp==NULL) return NULL;
19578c68143SDavid Wang     STORE_T *store = new STORE_T();
19678c68143SDavid Wang     unsigned long long start, end, offset;
19778c68143SDavid Wang     char *p;
19878c68143SDavid Wang     int i, c, j;
19978c68143SDavid Wang     while(1) {
20078c68143SDavid Wang         p=fgets(bb, sizeof(bb), fp); if (p==NULL) break;
20178c68143SDavid Wang         i=0; c=0;
20278c68143SDavid Wang         start = parse_hex(p, &c); if (start==0) continue; i+=c; if (p[i]!='-') continue; i++;
20378c68143SDavid Wang         end = parse_hex(p+i, &c); if (end==0) continue; i+=c;
20478c68143SDavid Wang         // parse type
20578c68143SDavid Wang         for (j=0; j<8; j++) { if (p[i]=='x') break; i++; } if (j>=8) continue;
20678c68143SDavid Wang         while(p[i]!=' '&&p[i]!='\t'&&p[i]!=0) i++; if (p[i]==0) continue;
20778c68143SDavid Wang         offset = parse_hex(p+i, &c); if (c==0) continue;
20878c68143SDavid Wang         // remaining should contains '/' indicating this mmap is refering to a file
20978c68143SDavid Wang         while(p[i]&&p[i]!='/') i++; if (p[i]==0) continue;
21078c68143SDavid Wang         sprintf(bb, "/proc/%d/map_files/%llx-%llx", pid, start, end);
21178c68143SDavid Wang         load_symbol_from_file(bb, start, end-start, offset, *store);
21278c68143SDavid Wang     }
21378c68143SDavid Wang     fclose(fp);
21478c68143SDavid Wang     return store;
21578c68143SDavid Wang }
21678c68143SDavid Wang 
21778c68143SDavid Wang /* parse kernel func symbols from /proc/kallsyms */
21878c68143SDavid Wang K_STORE_T* load_kernel() {
21978c68143SDavid Wang     FILE* fp = fopen("/proc/kallsyms", "r");
22078c68143SDavid Wang     if (fp == NULL) return NULL;
22178c68143SDavid Wang     char *p;
22278c68143SDavid Wang     unsigned long long addr;
22378c68143SDavid Wang     int c;
22478c68143SDavid Wang     K_STORE_T* store = new K_STORE_T();
22578c68143SDavid Wang     char bb[128], adr[128], type[8], name[128];
22678c68143SDavid Wang     while(1) {
22778c68143SDavid Wang         p = fgets(bb, sizeof(bb), fp); if (p==NULL) break;
22878c68143SDavid Wang         if (sscanf(p, "%s %s %s", adr, type, name)!=3) continue;;
22978c68143SDavid Wang         if (type[0]!='t'&&type[0]!='T') continue;
23078c68143SDavid Wang         addr=parse_hex(adr, &c); if (c==0) continue;
23178c68143SDavid Wang         (*store)[addr] = string(name);
23278c68143SDavid Wang     }
23378c68143SDavid Wang     return store;
23478c68143SDavid Wang     fclose(fp);
23578c68143SDavid Wang }
23678c68143SDavid Wang 
23778c68143SDavid Wang //------------------------------perf profiler-------------------------
/*
 * Thin wrapper that issues the perf_event_open system call through
 * syscall(), forwarding all arguments unchanged and returning its result.
 */
static long perf_event_open(struct perf_event_attr *perf_event, pid_t pid, int cpu, int group_fd, unsigned long flags) {
    const long result = syscall(__NR_perf_event_open, perf_event, pid, cpu, group_fd, flags);
    return result;
}
24178c68143SDavid Wang unordered_map<int, STORE_T*> pid_symbols;
24278c68143SDavid Wang K_STORE_T* kernel_symbols = NULL;
24378c68143SDavid Wang 
24478c68143SDavid Wang struct pollfd polls[MAXCPU];
24578c68143SDavid Wang // res for cleanup
24678c68143SDavid Wang static long long psize;
24778c68143SDavid Wang map<int, pair<void*, long long>> res;
24878c68143SDavid Wang TNode* gnode = NULL;
24978c68143SDavid Wang 
25078c68143SDavid Wang void int_exit(int _) {
25178c68143SDavid Wang     for (auto x: res) {
25278c68143SDavid Wang         auto y = x.second;
25378c68143SDavid Wang         void* addr = y.first;
25478c68143SDavid Wang         munmap(addr, (1+MAXN)*psize);
25578c68143SDavid Wang         close(x.first);
25678c68143SDavid Wang     }
25778c68143SDavid Wang     res.clear();
25878c68143SDavid Wang     if (gnode!=NULL) {
25978c68143SDavid Wang         FILE* fp = fopen("./report.html", "w");
26078c68143SDavid Wang         if (fp) {
26178c68143SDavid Wang             fprintf(fp, "<head> <link rel=\"stylesheet\" href=\"report.css\"> <script src=\"report.js\"> </script> </head>\n");
26278c68143SDavid Wang             fprintf(fp, "<ul class=\"tree\">\n");
26378c68143SDavid Wang             gnode->printit(fp, 0);
26478c68143SDavid Wang             fprintf(fp, "</ul>\n");
26578c68143SDavid Wang             fclose(fp);
26678c68143SDavid Wang             printf("report done\n");
26778c68143SDavid Wang         }
26878c68143SDavid Wang         gnode = NULL;
26978c68143SDavid Wang     }
27078c68143SDavid Wang }
27178c68143SDavid Wang /*
27278c68143SDavid Wang perf call chain process
27378c68143SDavid Wang For now, if a address would not be located to some function, the address would be skipped.
27478c68143SDavid Wang  */
27578c68143SDavid Wang int process_event(char *base, unsigned long long size, unsigned long long offset) {
27678c68143SDavid Wang     struct perf_event_header* p = NULL;
27778c68143SDavid Wang     int pid, xpid;
27878c68143SDavid Wang     unsigned long long time;
27978c68143SDavid Wang     offset%=size;
28078c68143SDavid Wang     // assuming the header would fit within size
28178c68143SDavid Wang     p = (struct perf_event_header*) (base+offset);
28278c68143SDavid Wang     offset+=sizeof(*p); if (offset>=size) offset-=size;
28378c68143SDavid Wang     if (p->type != PERF_RECORD_SAMPLE) return p->size;
28478c68143SDavid Wang     // pid, tip;
28578c68143SDavid Wang     pid = *((int *)(base+offset));  offset+=8; if (offset>=size) offset-=size;
28678c68143SDavid Wang     unsigned long long nr = *((unsigned long long*)(base+offset)); offset+=8; if (offset>=size) offset-=size;
28778c68143SDavid Wang     unsigned long long addr, o, addr0;
28878c68143SDavid Wang     if (nr) {
28978c68143SDavid Wang         if (gnode==NULL) gnode=new TNode();
29078c68143SDavid Wang         char bb[64];
29178c68143SDavid Wang         TNode* r = gnode;
29278c68143SDavid Wang         if (pid_symbols.count(pid)==0) pid_symbols[pid] = load_symbol_pid(pid);
29378c68143SDavid Wang         STORE_T* px = pid_symbols[pid];
29478c68143SDavid Wang         addr0 = *((unsigned long long *)(base+offset));
29578c68143SDavid Wang         char user_mark = 0;
29678c68143SDavid Wang         for (int i=nr-1; i>=0; i--) {
29778c68143SDavid Wang             o = i*8+offset; if (o>=size) o-=size;
29878c68143SDavid Wang             addr = *((unsigned long long*)(base+o));
29978c68143SDavid Wang             if ((addr>>56)==(addr0>>56) && (p->misc&PERF_RECORD_MISC_KERNEL)) {
30078c68143SDavid Wang                 // skip the cross line command, no idear how to correctly resolve it now.
30178c68143SDavid Wang                 if (user_mark) { user_mark=0; continue; }
30278c68143SDavid Wang                 // check in kernel
30378c68143SDavid Wang                 if (kernel_symbols&&!kernel_symbols->empty()) {
30478c68143SDavid Wang                     auto x = kernel_symbols->upper_bound(addr);
30578c68143SDavid Wang                     if (x==kernel_symbols->begin()) {
30678c68143SDavid Wang                         // sprintf(bb, "0x%llx", addr); r = r->add(string(bb));
30778c68143SDavid Wang                     } else {
30878c68143SDavid Wang                         x--;
30978c68143SDavid Wang                         r = r->add((*x).second);
31078c68143SDavid Wang                     }
31178c68143SDavid Wang                 } else {
31278c68143SDavid Wang                     // sprintf(bb, "0x%llx", addr); r = r->add(string(bb));
31378c68143SDavid Wang                 }
31478c68143SDavid Wang             } else {
31578c68143SDavid Wang                 if (px) {
31678c68143SDavid Wang                     auto x = px->upper_bound(addr);
31778c68143SDavid Wang                     if (x==px->begin()) {
31878c68143SDavid Wang                         // sprintf(bb, "0x%llx", addr); r = r->add(string(bb));
31978c68143SDavid Wang                     } else {
32078c68143SDavid Wang                         x--;
32178c68143SDavid Wang                         auto y = (*x).second;
32278c68143SDavid Wang                         if (addr>(*x).first+y.second) {
32378c68143SDavid Wang                             // r = r->add(y.first);
32478c68143SDavid Wang                             // sprintf(bb, "0x%llx", addr); r = r->add(string(bb));
32578c68143SDavid Wang                         } else {
32678c68143SDavid Wang                             r = r->add(y.first);
32778c68143SDavid Wang                         }
32878c68143SDavid Wang                     }
32978c68143SDavid Wang                 } else {
33078c68143SDavid Wang                     // sprintf(bb, "0x%llx", addr); r = r->add(string(bb));
33178c68143SDavid Wang                 }
33278c68143SDavid Wang                 user_mark=1;
33378c68143SDavid Wang             }
33478c68143SDavid Wang         }
33578c68143SDavid Wang     }
33678c68143SDavid Wang     return p->size;
33778c68143SDavid Wang }
33878c68143SDavid Wang 
33978c68143SDavid Wang int main(int argc, char *argv[]) {
34078c68143SDavid Wang     kernel_symbols = load_kernel();
341*4092c028SDavid Wang     if (argc<2) { printf("Need pid\n"); return 1; }
34278c68143SDavid Wang     int pid = atoi(argv[1]); if (pid<=0) { printf("invalid pid %s\n", argv[1]); return 1; }
34378c68143SDavid Wang     // find cgroup
34478c68143SDavid Wang     char xb[256], xb2[256];
34578c68143SDavid Wang     int i, j, k, fd;
34678c68143SDavid Wang     void* addr;
34778c68143SDavid Wang     sprintf(xb, "/proc/%d/cgroup", pid);
34878c68143SDavid Wang     FILE* fp = fopen(xb, "r");
34978c68143SDavid Wang     if (fp==NULL) error("fail to open cgroup file");
35078c68143SDavid Wang     char *p;
35178c68143SDavid Wang     xb2[0]=0;
352*4092c028SDavid Wang     int cgroup_name_len=0;
35378c68143SDavid Wang     while(1) {
35478c68143SDavid Wang         p = fgets(xb, sizeof(xb), fp); if (p==NULL) break;
35578c68143SDavid Wang         i=0; while(p[i]&&p[i]!=':') i++; if (p[i]==0) continue;
35678c68143SDavid Wang         if (strstr(p, "perf_event")) {
35778c68143SDavid Wang             i++; while(p[i]!=':'&&p[i]) i++;  if (p[i]!=':') continue; i++;
35878c68143SDavid Wang             j=i; while(p[j]!='\r'&&p[j]!='\n'&&p[j]!=0) j++; p[j]=0;
35978c68143SDavid Wang             sprintf(xb2, "/sys/fs/cgroup/perf_event%s", p+i);
360*4092c028SDavid Wang             cgroup_name_len=j-i;
36178c68143SDavid Wang             break;
36278c68143SDavid Wang         } else if (p[i+1]==':') {
36378c68143SDavid Wang             i+=2; j=i; while(p[j]!='\r'&&p[j]!='\n'&&p[j]!=0) j++; p[j]=0;
36478c68143SDavid Wang             sprintf(xb2, "/sys/fs/cgroup/%s", p+i);
365*4092c028SDavid Wang             cgroup_name_len=j-i;
36678c68143SDavid Wang         }
36778c68143SDavid Wang     }
36878c68143SDavid Wang     fclose(fp);
36978c68143SDavid Wang     if (xb2[0]==0) error("no proper cgroup found\n");
370*4092c028SDavid Wang     if (cgroup_name_len<2) {
371*4092c028SDavid Wang         printf("cgroup %s seems to be root, not allowed\n", xb2);
372*4092c028SDavid Wang         return -1;
373*4092c028SDavid Wang     }
37478c68143SDavid Wang     printf("try to use cgroup %s\n", xb2);
37578c68143SDavid Wang     int cgroup_id = open(xb2, O_CLOEXEC);
37678c68143SDavid Wang     if (cgroup_id<=0) { perror("error open cgroup dir"); return 1; }
37778c68143SDavid Wang     // start perf event
37878c68143SDavid Wang     psize = sysconf(_SC_PAGE_SIZE); // getpagesize();
37978c68143SDavid Wang     int cpu_num = sysconf(_SC_NPROCESSORS_ONLN);
38078c68143SDavid Wang 	struct perf_event_attr attr;
38178c68143SDavid Wang     memset(&attr, 0, sizeof(attr));
38278c68143SDavid Wang     attr.type = PERF_TYPE_SOFTWARE;
38378c68143SDavid Wang     attr.size = sizeof(attr);
38478c68143SDavid Wang     attr.config = PERF_COUNT_SW_CPU_CLOCK;
38578c68143SDavid Wang     attr.sample_freq = 369; // adjust it
38678c68143SDavid Wang     attr.freq = 1;
38778c68143SDavid Wang     attr.wakeup_events = 32;
38878c68143SDavid Wang     attr.sample_type = PERF_SAMPLE_TID|PERF_SAMPLE_CALLCHAIN;
38978c68143SDavid Wang     for (i=0, k=0; i<cpu_num&&i<MAXCPU; i++) {
39078c68143SDavid Wang         printf("attaching cpu %d\n", i);
39178c68143SDavid Wang         fd = perf_event_open(&attr, cgroup_id, i, -1, PERF_FLAG_FD_CLOEXEC|PERF_FLAG_PID_CGROUP);
39278c68143SDavid Wang         if (fd<0) { perror("fail to open perf event"); continue; }
39378c68143SDavid Wang         addr = mmap(NULL, (1+MAXN)*psize, PROT_READ, MAP_SHARED, fd, 0);
39478c68143SDavid Wang         if (addr == MAP_FAILED) { perror("mmap failed"); close(fd); continue; }
39578c68143SDavid Wang         res[fd] = make_pair(addr, 0);
39678c68143SDavid Wang         polls[k].fd = fd;
39778c68143SDavid Wang         polls[k].events = POLLIN;
39878c68143SDavid Wang         polls[k].revents = 0;
39978c68143SDavid Wang         k++;
40078c68143SDavid Wang     }
40178c68143SDavid Wang     if (k==0) { printf("no cpu event attached at all\n"); return 1; }
40278c68143SDavid Wang 
40378c68143SDavid Wang 	signal(SIGINT, int_exit);
40478c68143SDavid Wang 	signal(SIGTERM, int_exit);
40578c68143SDavid Wang 
40678c68143SDavid Wang     unsigned long long head;
40778c68143SDavid Wang     struct perf_event_mmap_page *mp;
40878c68143SDavid Wang     while (poll(polls, k, -1)>0) {
40978c68143SDavid Wang         // printf("wake\n");
41078c68143SDavid Wang         for (i=0; i<k; i++) {
41178c68143SDavid Wang             if ((polls[i].revents&POLLIN)==0) continue;
41278c68143SDavid Wang             fd = polls[i].fd;
41378c68143SDavid Wang             addr = res[fd].first;
41478c68143SDavid Wang             mp = (struct perf_event_mmap_page *)addr;
41578c68143SDavid Wang             head = res[fd].second;
41678c68143SDavid Wang             if (head==mp->data_head) continue;
41778c68143SDavid Wang             ioctl(fd, PERF_EVENT_IOC_PAUSE_OUTPUT, 1);
41878c68143SDavid Wang             head = mp->data_head-((mp->data_head-head)%mp->data_size);
41978c68143SDavid Wang             while(head<mp->data_head) head+=process_event((char*)addr+mp->data_offset, mp->data_size, head);
42078c68143SDavid Wang             ioctl(fd, PERF_EVENT_IOC_PAUSE_OUTPUT, 0);
42178c68143SDavid Wang             res[fd].second = mp->data_head;
42278c68143SDavid Wang         }
42378c68143SDavid Wang     }
42478c68143SDavid Wang 
42578c68143SDavid Wang     int_exit(0);
42678c68143SDavid Wang     return 0;
42778c68143SDavid Wang }
428