forked from phacility/xhprof
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathxhprof.c
2052 lines (1752 loc) · 57.9 KB
/
xhprof.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
/*
* Copyright (c) 2009 Facebook
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
*/
#ifdef HAVE_CONFIG_H
#include "config.h"
#endif
#ifdef linux
/* To enable CPU_ZERO and CPU_SET, etc. */
# define _GNU_SOURCE
#endif
#include "php.h"
#include "php_ini.h"
#include "ext/standard/info.h"
#include "php_xhprof.h"
#include "zend_extensions.h"
#include <sys/time.h>
#include <sys/resource.h>
#include <stdlib.h>
#include <unistd.h>
#ifdef __FreeBSD__
# if __FreeBSD_version >= 700110
# include <sys/resource.h>
# include <sys/cpuset.h>
# define cpu_set_t cpuset_t
# define SET_AFFINITY(pid, size, mask) \
cpuset_setaffinity(CPU_LEVEL_WHICH, CPU_WHICH_TID, -1, size, mask)
# define GET_AFFINITY(pid, size, mask) \
cpuset_getaffinity(CPU_LEVEL_WHICH, CPU_WHICH_TID, -1, size, mask)
# else
# error "This version of FreeBSD does not support cpusets"
# endif /* __FreeBSD_version */
#elif __APPLE__
/*
* Patch for compiling in Mac OS X Leopard
* @author Svilen Spasov <s.spasov@gmail.com>
*/
# include <mach/mach_init.h>
# include <mach/thread_policy.h>
# define cpu_set_t thread_affinity_policy_data_t
# define CPU_SET(cpu_id, new_mask) \
(*(new_mask)).affinity_tag = (cpu_id + 1)
# define CPU_ZERO(new_mask) \
(*(new_mask)).affinity_tag = THREAD_AFFINITY_TAG_NULL
# define SET_AFFINITY(pid, size, mask) \
thread_policy_set(mach_thread_self(), THREAD_AFFINITY_POLICY, mask, \
THREAD_AFFINITY_POLICY_COUNT)
#else
/* For sched_getaffinity, sched_setaffinity */
# include <sched.h>
# define SET_AFFINITY(pid, size, mask) sched_setaffinity(0, size, mask)
# define GET_AFFINITY(pid, size, mask) sched_getaffinity(0, size, mask)
#endif /* __FreeBSD__ */
/**
* **********************
* GLOBAL MACRO CONSTANTS
* **********************
*/
/* XHProf version string; reported by the module entry and the info table. */
#define XHPROF_VERSION "0.9.2"
/* Fictitious function name to represent the top of the call tree. The
* parentheses in the name ensure we don't conflict with user function names. */
#define ROOT_SYMBOL "main()"
/* Size, in bytes, of a temporary scratch buffer */
#define SCRATCH_BUF_LEN 512
/* Various XHPROF modes. If you are adding a new mode, register the appropriate
* callbacks in hp_begin() */
#define XHPROF_MODE_HIERARCHICAL 1
#define XHPROF_MODE_SAMPLED 620002 /* Rockfort's zip code */
/* Hierarchical profiling flags (bit values that can be OR-ed together).
*
* Note: Function call counts and wall (elapsed) time are always profiled.
* The following optional flags can be used to control other aspects of
* profiling.
*/
#define XHPROF_FLAGS_NO_BUILTINS 0x0001 /* do not profile builtins */
#define XHPROF_FLAGS_CPU 0x0002 /* gather CPU times for funcs */
#define XHPROF_FLAGS_MEMORY 0x0004 /* gather memory usage for funcs */
/* Constants for XHPROF_MODE_SAMPLED */
#define XHPROF_SAMPLING_INTERVAL 100000 /* In microsecs */
/* Constants for ignoring functions, transparent to hierarchical profile.
* The filter is a bit vector with one bit per possible value, rounded up to
* whole bytes: (256 + 7) / 8 = 32 bytes. */
#define XHPROF_MAX_IGNORED_FUNCTIONS 256
#define XHPROF_IGNORED_FUNCTION_FILTER_SIZE \
((XHPROF_MAX_IGNORED_FUNCTIONS + 7)/8)
/* Short integer aliases used throughout this file.
* NOTE(review): defined() only sees preprocessor macros, so each guard skips
* its typedef only when a macro of that name exists; an existing typedef with
* the same name would not be detected here. */
#if !defined(uint64)
typedef unsigned long long uint64;
#endif
#if !defined(uint32)
typedef unsigned int uint32;
#endif
#if !defined(uint8)
typedef unsigned char uint8;
#endif
/**
* *****************************
* GLOBAL DATATYPES AND TYPEDEFS
* *****************************
*/
/* XHProf maintains a stack of entries being profiled, linked through
* prev_hprof. In this file BEGIN_PROFILING() obtains each entry from
* hp_fast_alloc_hprof_entry() and END_PROFILING() hands it back through
* hp_fast_free_hprof_entry().
*
* This structure is a convenient place to track the start time of a particular
* profile operation, recursion depth, and the name of the function being
* profiled. */
typedef struct hp_entry_t {
char *name_hprof; /* function name */
int rlvl_hprof; /* recursion level for function; non-zero adds "@<n>" to the name */
uint64 tsc_start; /* start value for TSC counter */
long int mu_start_hprof; /* memory usage at start */
long int pmu_start_hprof; /* peak memory usage at start */
struct rusage ru_start_hprof; /* user/sys time start */
struct hp_entry_t *prev_hprof; /* ptr to prev entry being profiled (the caller), or NULL */
uint8 hash_code; /* 8-bit hash_code for the function name (see hp_inline_hash) */
} hp_entry_t;
/* Various types for XHPROF callbacks.
*
* hp_init_cb / hp_exit_cb: invoked from hp_init_profiler_state() and
* hp_clean_profiler_state() respectively.
* hp_begin_function_cb: invoked by BEGIN_PROFILING() with the stack head and
* the entry about to be pushed.
* hp_end_function_cb: invoked by END_PROFILING() with the stack head, before
* the top entry is popped. */
typedef void (*hp_init_cb) (TSRMLS_D);
typedef void (*hp_exit_cb) (TSRMLS_D);
typedef void (*hp_begin_function_cb) (hp_entry_t **entries,
hp_entry_t *current TSRMLS_DC);
typedef void (*hp_end_function_cb) (hp_entry_t **entries TSRMLS_DC);
/* Struct to hold the various callbacks for a single xhprof mode.
* The active set is stored in hp_globals.mode_cb. */
typedef struct hp_mode_cb {
hp_init_cb init_cb; /* called when profiler state is initialized */
hp_exit_cb exit_cb; /* called when profiler state is cleaned up */
hp_begin_function_cb begin_fn_cb; /* called as a profiled function begins */
hp_end_function_cb end_fn_cb; /* called as a profiled function ends */
} hp_mode_cb;
/* Xhprof's global state.
*
* This structure is instantiated once (as the file-scope hp_globals).
* Initialize defaults for attributes in hp_init_profiler_state(); clean up and
* free attributes in hp_clean_profiler_state(). */
typedef struct hp_global_t {
/* ---------- Global attributes: ----------- */
/* Indicates if xhprof is currently enabled */
int enabled;
/* Indicates if xhprof was ever enabled during this request */
int ever_enabled;
/* Holds all the xhprof statistics (a PHP array zval, or NULL) */
zval *stats_count;
/* Indicates the current xhprof mode or level */
int profiler_level;
/* Top of the profile stack */
hp_entry_t *entries;
/* freelist of hp_entry_t chunks for reuse... */
hp_entry_t *entry_free_list;
/* Callbacks for various xhprof modes */
hp_mode_cb mode_cb;
/* ---------- Mode specific attributes: ----------- */
/* Global to track the time of the last sample in time and ticks */
struct timeval last_sample_time;
uint64 last_sample_tsc;
/* XHPROF_SAMPLING_INTERVAL in ticks */
uint64 sampling_interval_tsc;
/* This array is used to store cpu frequencies for all available logical
* cpus. For now, we assume the cpu frequencies will not change for power
* saving or other reasons. If we need to worry about that in the future, we
* can use a periodic timer to re-calculate this array every once in a
* while (for example, every 1 or 5 seconds). NULL until first computed. */
double *cpu_frequencies;
/* The number of logical CPUs this machine has. */
uint32 cpu_num;
/* The saved cpu affinity. */
cpu_set_t prev_mask;
/* The cpu id current process is bound to. (default 0) */
uint32 cur_cpu_id;
/* XHProf flags */
uint32 xhprof_flags;
/* counter table indexed by hash value of function names. */
uint8 func_hash_counters[256];
/* NULL-terminated table of ignored function names (or NULL when nothing is
* ignored) and the bit-vector filter built from their 8-bit hashes */
char **ignored_function_names;
uint8 ignored_function_filter[XHPROF_IGNORED_FUNCTION_FILTER_SIZE];
} hp_global_t;
/**
* ***********************
* GLOBAL STATIC VARIABLES
* ***********************
*/
/* XHProf global state (single instance; static storage, so zero-initialized) */
static hp_global_t hp_globals;
/* Saved engine hooks. The hook signatures differ between PHP versions, hence
* the PHP_VERSION_ID split below.
* NOTE(review): presumably these are filled in where the profiler installs
* its own hooks; that code is not in this part of the file. */
#if PHP_VERSION_ID < 50500
/* Pointer to the original execute function */
static ZEND_DLEXPORT void (*_zend_execute) (zend_op_array *ops TSRMLS_DC);
/* Pointer to the original execute_internal function */
static ZEND_DLEXPORT void (*_zend_execute_internal) (zend_execute_data *data,
int ret TSRMLS_DC);
#else
/* Pointer to the original execute function */
static void (*_zend_execute_ex) (zend_execute_data *execute_data TSRMLS_DC);
/* Pointer to the original execute_internal function */
static void (*_zend_execute_internal) (zend_execute_data *data,
struct _zend_fcall_info *fci, int ret TSRMLS_DC);
#endif
/* Pointer to the original compile function */
static zend_op_array * (*_zend_compile_file) (zend_file_handle *file_handle,
int type TSRMLS_DC);
/* Pointer to the original compile string function (used by eval) */
static zend_op_array * (*_zend_compile_string) (zval *source_string, char *filename TSRMLS_DC);
/* Bit-vector filter for function names to be ignored.
 *
 * An 8-bit hash selects one bit of the filter: INDEX_2_BYTE() yields the byte
 * offset (hash / 8) and INDEX_2_BIT() the mask for the bit inside that byte
 * (1 << (hash % 8)). Both expand to fully parenthesized expressions with no
 * trailing semicolon, so they can be used anywhere an expression is valid. */
#define INDEX_2_BYTE(index) ((index) >> 3)
#define INDEX_2_BIT(index) (1 << ((index) & 0x7))
/**
* ****************************
* STATIC FUNCTION DECLARATIONS
* ****************************
*/
/* Forward declarations for file-local helpers, so they can be used before
* their definitions appear. */
/* -- profiler lifecycle -- */
static void hp_register_constants(INIT_FUNC_ARGS);
static void hp_begin(long level, long xhprof_flags TSRMLS_DC);
static void hp_stop(TSRMLS_D);
static void hp_end(TSRMLS_D);
/* -- timing and cpu frequency helpers -- */
static inline uint64 cycle_timer();
static double get_cpu_frequency();
static void clear_frequencies();
/* -- hp_entry_t free list -- */
static void hp_free_the_free_list();
static hp_entry_t *hp_fast_alloc_hprof_entry();
static void hp_fast_free_hprof_entry(hp_entry_t *p);
static inline uint8 hp_inline_hash(char * str);
static void get_all_cpu_frequencies();
static long get_us_interval(struct timeval *start, struct timeval *end);
static void incr_us_interval(struct timeval *start, uint64 incr);
/* -- ignored-function list and its filter -- */
static void hp_get_ignored_functions_from_arg(zval *args);
static void hp_ignored_functions_filter_clear();
static void hp_ignored_functions_filter_init();
/* -- zval / string-array utilities -- */
static inline zval *hp_zval_at_key(char *key,
zval *values);
static inline char **hp_strings_in_zval(zval *values);
static inline void hp_array_del(char **name_array);
/* {{{ arginfo
* Argument descriptions for the PHP functions exposed by this extension. */
/* xhprof_enable([flags [, options]]): both arguments are optional, matching
* the "|lz" parse spec used in PHP_FUNCTION(xhprof_enable). */
ZEND_BEGIN_ARG_INFO_EX(arginfo_xhprof_enable, 0, 0, 0)
ZEND_ARG_INFO(0, flags)
ZEND_ARG_INFO(0, options)
ZEND_END_ARG_INFO()
/* The remaining functions declare no arguments. */
ZEND_BEGIN_ARG_INFO(arginfo_xhprof_disable, 0)
ZEND_END_ARG_INFO()
ZEND_BEGIN_ARG_INFO(arginfo_xhprof_sample_enable, 0)
ZEND_END_ARG_INFO()
ZEND_BEGIN_ARG_INFO(arginfo_xhprof_sample_disable, 0)
ZEND_END_ARG_INFO()
/* }}} */
/**
* *********************
* FUNCTION PROTOTYPES
* *********************
*/
/* CPU affinity helpers; both are called from hp_init_profiler_state(). */
int restore_cpu_affinity(cpu_set_t * prev_mask);
int bind_to_cpu(uint32 cpu_id);
/**
* *********************
* PHP EXTENSION GLOBALS
* *********************
*/
/* List of functions implemented/exposed by xhprof. Each entry pairs a
* PHP_FUNCTION defined in this file with its arginfo; the all-NULL entry
* terminates the table. */
zend_function_entry xhprof_functions[] = {
PHP_FE(xhprof_enable, arginfo_xhprof_enable)
PHP_FE(xhprof_disable, arginfo_xhprof_disable)
PHP_FE(xhprof_sample_enable, arginfo_xhprof_sample_enable)
PHP_FE(xhprof_sample_disable, arginfo_xhprof_sample_disable)
{NULL, NULL, NULL}
};
/* Module descriptor for the xhprof extension: name, exported function table
* and the lifecycle callbacks defined in this file. The header and version
* fields are only emitted when ZEND_MODULE_API_NO >= 20010901. */
zend_module_entry xhprof_module_entry = {
#if ZEND_MODULE_API_NO >= 20010901
STANDARD_MODULE_HEADER,
#endif
"xhprof", /* Name of the extension */
xhprof_functions, /* List of functions exposed */
PHP_MINIT(xhprof), /* Module init callback */
PHP_MSHUTDOWN(xhprof), /* Module shutdown callback */
PHP_RINIT(xhprof), /* Request init callback */
PHP_RSHUTDOWN(xhprof), /* Request shutdown callback */
PHP_MINFO(xhprof), /* Module info callback */
#if ZEND_MODULE_API_NO >= 20010901
XHPROF_VERSION, /* Extension version string */
#endif
STANDARD_MODULE_PROPERTIES
};
/* INI settings of the extension; registered in MINIT via
* REGISTER_INI_ENTRIES() and removed in MSHUTDOWN. */
PHP_INI_BEGIN()
/* output directory (default: empty string, no change handler):
* Currently this is not used by the extension itself.
* But some implementations of the iXHProfRuns interface might
* choose to save/restore XHProf profiler runs in the
* directory specified by this ini setting.
*/
PHP_INI_ENTRY("xhprof.output_dir", "", PHP_INI_ALL, NULL)
PHP_INI_END()
/* Init module */
ZEND_GET_MODULE(xhprof)
/**
* **********************************
* PHP EXTENSION FUNCTION DEFINITIONS
* **********************************
*/
/**
 * Start XHProf profiling in hierarchical mode.
 *
 * Both arguments are optional. The second one is handed to
 * hp_get_ignored_functions_from_arg(), which looks up its
 * "ignored_functions" key.
 *
 * @param  long  $flags    flags for hierarchical mode (defaults to 0)
 * @param  mixed $options  optional settings value (defaults to none)
 * @return void
 * @author kannan
 */
PHP_FUNCTION(xhprof_enable) {
  zval *options = NULL;   /* stays NULL when the caller omits it */
  long  flags   = 0;      /* XHProf flags */

  if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "|lz",
                            &flags, &options) == FAILURE) {
    /* Argument parsing failed: do not start profiling. */
    return;
  }

  /* Replace the ignored-function list before the profiler starts. */
  hp_get_ignored_functions_from_arg(options);

  hp_begin(XHPROF_MODE_HIERARCHICAL, flags TSRMLS_CC);
}
/**
 * Stop hierarchical profiling and hand back the collected profile.
 *
 * @param  void
 * @return array  hash-array of XHProf's profile info; nothing is returned
 *                (PHP null) when the profiler is not enabled
 * @author kannan, hzhao
 */
PHP_FUNCTION(xhprof_disable) {
  if (!hp_globals.enabled) {
    /* Profiler not running: leave the return value untouched (null). */
    return;
  }

  hp_stop(TSRMLS_C);
  RETURN_ZVAL(hp_globals.stats_count, 1, 0);
}
/**
 * Start XHProf profiling in sampling mode.
 *
 * Sampling mode takes no arguments: any previous ignored-function list is
 * dropped and the profiler is started with no flags set.
 *
 * @return void
 * @author cjiang
 */
PHP_FUNCTION(xhprof_sample_enable) {
  const long no_flags = 0;

  hp_get_ignored_functions_from_arg(NULL);
  hp_begin(XHPROF_MODE_SAMPLED, no_flags TSRMLS_CC);
}
/**
 * Stop sampling-mode profiling and hand back the collected profile.
 *
 * @param  void
 * @return array  hash-array of XHProf's profile info; nothing is returned
 *                (PHP null) when the profiler is not enabled
 * @author cjiang
 */
PHP_FUNCTION(xhprof_sample_disable) {
  if (!hp_globals.enabled) {
    /* Profiler not running: leave the return value untouched (null). */
    return;
  }

  hp_stop(TSRMLS_C);
  RETURN_ZVAL(hp_globals.stats_count, 1, 0);
}
/**
* Module init callback.
*
* @author cjiang
*/
PHP_MINIT_FUNCTION(xhprof) {
int i;
REGISTER_INI_ENTRIES();
hp_register_constants(INIT_FUNC_ARGS_PASSTHRU);
/* Get the number of available logical CPUs. */
hp_globals.cpu_num = sysconf(_SC_NPROCESSORS_CONF);
/* Get the cpu affinity mask. */
#ifndef __APPLE__
if (GET_AFFINITY(0, sizeof(cpu_set_t), &hp_globals.prev_mask) < 0) {
perror("getaffinity");
return FAILURE;
}
#else
CPU_ZERO(&(hp_globals.prev_mask));
#endif
/* Initialize cpu_frequencies and cur_cpu_id. */
hp_globals.cpu_frequencies = NULL;
hp_globals.cur_cpu_id = 0;
hp_globals.stats_count = NULL;
/* no free hp_entry_t structures to start with */
hp_globals.entry_free_list = NULL;
for (i = 0; i < 256; i++) {
hp_globals.func_hash_counters[i] = 0;
}
hp_ignored_functions_filter_clear();
#if defined(DEBUG)
/* To make it random number generator repeatable to ease testing. */
srand(0);
#endif
return SUCCESS;
}
/**
 * Module shutdown callback: releases module-lifetime resources and
 * unregisters the INI entries.
 */
PHP_MSHUTDOWN_FUNCTION(xhprof) {
  /* Release the cpu frequency table, if any. */
  clear_frequencies();

  /* Release every hp_entry_t still parked on the free list. */
  hp_free_the_free_list();

  UNREGISTER_INI_ENTRIES();

  return SUCCESS;
}
/**
 * Request init callback. There is no per-request setup at this point, so it
 * simply reports success.
 */
PHP_RINIT_FUNCTION(xhprof)
{
  return SUCCESS;
}
/**
 * Request shutdown callback. Ends profiling for the request via hp_end()
 * and reports success.
 */
PHP_RSHUTDOWN_FUNCTION(xhprof)
{
  hp_end(TSRMLS_C);

  return SUCCESS;
}
/**
* Module info callback. Returns the xhprof version.
*/
PHP_MINFO_FUNCTION(xhprof)
{
char buf[SCRATCH_BUF_LEN];
char tmp[SCRATCH_BUF_LEN];
int i;
int len;
php_info_print_table_start();
php_info_print_table_header(2, "xhprof", XHPROF_VERSION);
len = snprintf(buf, SCRATCH_BUF_LEN, "%d", hp_globals.cpu_num);
buf[len] = 0;
php_info_print_table_header(2, "CPU num", buf);
if (hp_globals.cpu_frequencies) {
/* Print available cpu frequencies here. */
php_info_print_table_header(2, "CPU logical id", " Clock Rate (MHz) ");
for (i = 0; i < hp_globals.cpu_num; ++i) {
len = snprintf(buf, SCRATCH_BUF_LEN, " CPU %d ", i);
buf[len] = 0;
len = snprintf(tmp, SCRATCH_BUF_LEN, "%f", hp_globals.cpu_frequencies[i]);
tmp[len] = 0;
php_info_print_table_row(2, buf, tmp);
}
}
php_info_print_table_end();
}
/**
* ***************************************************
* COMMON HELPER FUNCTION DEFINITIONS AND LOCAL MACROS
* ***************************************************
*/
/**
 * Expose the XHPROF_FLAGS_* bit values as PHP constants. All three are
 * registered as case-sensitive, persistent constants.
 */
static void hp_register_constants(INIT_FUNC_ARGS) {
  const int const_flags = CONST_CS | CONST_PERSISTENT;

  REGISTER_LONG_CONSTANT("XHPROF_FLAGS_NO_BUILTINS",
                         XHPROF_FLAGS_NO_BUILTINS, const_flags);
  REGISTER_LONG_CONSTANT("XHPROF_FLAGS_CPU",
                         XHPROF_FLAGS_CPU, const_flags);
  REGISTER_LONG_CONSTANT("XHPROF_FLAGS_MEMORY",
                         XHPROF_FLAGS_MEMORY, const_flags);
}
/**
 * Compute an 8-bit hash code for a function name.
 *
 * A word-sized hash is built first (seed 5381; for every character the hash
 * is multiplied by 33 and then xor-ed with the character), after which all
 * bytes of that word are added together, wrapping at 8 bits.
 *
 * @param str, char *, NUL-terminated string to hash.
 * @return the 8-bit hash code.
 *
 * @author cjiang
 */
static inline uint8 hp_inline_hash(char * str) {
  ulong        word   = 5381;
  const uint8 *bytes  = (const uint8 *) &word;
  uint8        folded = 0;
  uint         k;

  for (; *str; ++str) {
    word = word + (word << 5);   /* word *= 33 */
    word ^= (ulong) *str;
  }

  /* Fold the word into a single byte by summing its bytes. */
  for (k = 0; k < sizeof(ulong); ++k) {
    folded += bytes[k];
  }

  return folded;
}
/**
 * Replace the list of ignored function names.
 *
 * Any previous list is released first. When args is non-NULL the new list is
 * built from the value stored under its "ignored_functions" key; otherwise
 * the list is reset to NULL (nothing ignored).
 *
 * @param args  options value passed by the caller, or NULL
 * @author mpal
 */
static void hp_get_ignored_functions_from_arg(zval *args) {
  char **names = NULL;

  if (hp_globals.ignored_function_names) {
    hp_array_del(hp_globals.ignored_function_names);
  }

  if (args != NULL) {
    zval *listed = hp_zval_at_key("ignored_functions", args);
    names = hp_strings_in_zval(listed);
  }

  hp_globals.ignored_function_names = names;
}
/**
 * Reset the ignored-function filter so that no hash value is marked.
 *
 * @author mpal
 */
static void hp_ignored_functions_filter_clear() {
  /* The filter is an array of XHPROF_IGNORED_FUNCTION_FILTER_SIZE bytes, so
   * sizeof covers exactly the whole bit vector. */
  memset(hp_globals.ignored_function_filter, 0,
         sizeof(hp_globals.ignored_function_filter));
}
/**
 * Populate the ignored-function bit vector: for every name in the ignore
 * list, set the bit selected by the name's 8-bit hash. Does nothing when no
 * ignore list is installed.
 *
 * @author mpal
 */
static void hp_ignored_functions_filter_init() {
  char **name = hp_globals.ignored_function_names;

  if (name == NULL) {
    return;
  }

  /* The list is NULL-terminated. */
  for (; *name != NULL; ++name) {
    uint8 hash = hp_inline_hash(*name);
    hp_globals.ignored_function_filter[INDEX_2_BYTE(hash)] |= INDEX_2_BIT(hash);
  }
}
/**
 * Test whether the filter bit for a hash value is set, i.e. whether some
 * ignored function name hashes to the same value.
 *
 * @param hash  8-bit hash of the function name being checked
 * @return non-zero when the bit is set, 0 otherwise
 * @author mpal
 */
int hp_ignored_functions_filter_collision(uint8 hash) {
  uint8 bucket = hp_globals.ignored_function_filter[INDEX_2_BYTE(hash)];
  uint8 bit = INDEX_2_BIT(hash);

  return bucket & bit;
}
/**
* Initialize profiler state for a new profiling run: reset the stats array,
* make sure cpu frequencies are known, pin the process to one cpu, run the
* active mode's init callback and build the ignored-function filter.
*
* @param level profiler mode/level, stored in hp_globals.profiler_level
* @author kannan, veeve
*/
void hp_init_profiler_state(int level TSRMLS_DC) {
/* Setup globals; the entry stack is only reset on the first enable */
if (!hp_globals.ever_enabled) {
hp_globals.ever_enabled = 1;
hp_globals.entries = NULL;
}
hp_globals.profiler_level = (int) level;
/* Init stats_count: discard any previous results and start a fresh array */
if (hp_globals.stats_count) {
zval_dtor(hp_globals.stats_count);
FREE_ZVAL(hp_globals.stats_count);
}
MAKE_STD_ZVAL(hp_globals.stats_count);
array_init(hp_globals.stats_count);
/* NOTE(cjiang): some fields such as cpu_frequencies take relatively longer
* to initialize, (5 milliseconds per logical cpu right now), therefore we
* calculate them lazily. The saved affinity mask is restored afterwards. */
if (hp_globals.cpu_frequencies == NULL) {
get_all_cpu_frequencies();
restore_cpu_affinity(&hp_globals.prev_mask);
}
/* bind to a random cpu so that we can use rdtsc instruction.
* NOTE(review): the modulus assumes hp_globals.cpu_num is non-zero. */
bind_to_cpu((int) (rand() % hp_globals.cpu_num));
/* Call current mode's init cb */
hp_globals.mode_cb.init_cb(TSRMLS_C);
/* Set up filter of functions which may be ignored during profiling */
hp_ignored_functions_filter_init();
}
/**
 * Tear down profiler state: runs the active mode's exit callback, releases
 * the stats array, resets the bookkeeping globals and drops the list of
 * ignored function names.
 *
 * @author kannan, veeve
 */
void hp_clean_profiler_state(TSRMLS_D) {
  /* The mode gets to clean up first, while the globals are still intact. */
  hp_globals.mode_cb.exit_cb(TSRMLS_C);

  /* Release the collected statistics, if any. */
  if (hp_globals.stats_count != NULL) {
    zval_dtor(hp_globals.stats_count);
    FREE_ZVAL(hp_globals.stats_count);
    hp_globals.stats_count = NULL;
  }

  /* Back to the pristine "never enabled" state. */
  hp_globals.ever_enabled   = 0;
  hp_globals.profiler_level = 1;
  hp_globals.entries        = NULL;

  /* Delete the array storing ignored function names */
  hp_array_del(hp_globals.ignored_function_names);
  hp_globals.ignored_function_names = NULL;
}
/*
* Start profiling - called just before calling the actual function.
*
* entries: pointer to the head of the profile stack (hp_entry_t **)
* symbol: name of the function about to run; stored in the new entry
* as-is (not copied). It is expanded more than once, so pass an
* expression without side effects.
* profile_curr: lvalue that receives 1 when the function is profiled and 0
* when it is on the ignore list; pass the same variable to
* END_PROFILING().
*
* When the function is not ignored, an entry is taken from
* hp_fast_alloc_hprof_entry(), filled in, passed to the common and
* mode-specific begin callbacks, and then pushed onto the stack.
*
* NOTE: PLEASE MAKE SURE TSRMLS_CC IS AVAILABLE IN THE CONTEXT
* OF THE FUNCTION WHERE THIS MACRO IS CALLED.
* TSRMLS_CC CAN BE MADE AVAILABLE VIA TSRMLS_DC IN THE
* CALLING FUNCTION OR BY CALLING TSRMLS_FETCH()
* TSRMLS_FETCH() IS RELATIVELY EXPENSIVE.
*/
#define BEGIN_PROFILING(entries, symbol, profile_curr) \
do { \
/* Use a hash code to filter most of the string comparisons. */ \
uint8 hash_code = hp_inline_hash(symbol); \
profile_curr = !hp_ignore_entry(hash_code, symbol); \
if (profile_curr) { \
hp_entry_t *cur_entry = hp_fast_alloc_hprof_entry(); \
(cur_entry)->hash_code = hash_code; \
(cur_entry)->name_hprof = symbol; \
(cur_entry)->prev_hprof = (*(entries)); \
/* Call the universal callback */ \
hp_mode_common_beginfn((entries), (cur_entry) TSRMLS_CC); \
/* Call the mode's beginfn callback */ \
hp_globals.mode_cb.begin_fn_cb((entries), (cur_entry) TSRMLS_CC); \
/* Update entries linked list */ \
(*(entries)) = (cur_entry); \
} \
} while (0)
/*
* Stop profiling - called just after calling the actual function.
*
* entries: pointer to the head of the profile stack (hp_entry_t **)
* profile_curr: the value set by the matching BEGIN_PROFILING(); nothing
* happens when it is 0.
*
* When profile_curr is set, the mode-specific end callback runs first, then
* the common end callback, and finally the top entry is popped from the stack
* and returned to hp_fast_free_hprof_entry().
*
* NOTE: PLEASE MAKE SURE TSRMLS_CC IS AVAILABLE IN THE CONTEXT
* OF THE FUNCTION WHERE THIS MACRO IS CALLED.
* TSRMLS_CC CAN BE MADE AVAILABLE VIA TSRMLS_DC IN THE
* CALLING FUNCTION OR BY CALLING TSRMLS_FETCH()
* TSRMLS_FETCH() IS RELATIVELY EXPENSIVE.
*/
#define END_PROFILING(entries, profile_curr) \
do { \
if (profile_curr) { \
hp_entry_t *cur_entry; \
/* Call the mode's endfn callback. */ \
/* NOTE(cjiang): we want to call this 'end_fn_cb' before */ \
/* 'hp_mode_common_endfn' to avoid including the time in */ \
/* 'hp_mode_common_endfn' in the profiling results. */ \
hp_globals.mode_cb.end_fn_cb((entries) TSRMLS_CC); \
cur_entry = (*(entries)); \
/* Call the universal callback */ \
hp_mode_common_endfn((entries), (cur_entry) TSRMLS_CC); \
/* Free top entry and update entries linked list */ \
(*(entries)) = (*(entries))->prev_hprof; \
hp_fast_free_hprof_entry(cur_entry); \
} \
} while (0)
/**
 * Write the display name of an entry into result_buf.
 *
 * The name is the function name, followed by "@<recursion level>" when the
 * recursion level is non-zero. Output is truncated to fit and is always
 * NUL-terminated, unless the buffer is too small to hold anything.
 *
 * @param  entry       hp_entry
 * @param  result_buf  ptr to result buf
 * @param  result_len  max size of result buf
 * @return length of the string now in result_buf; 0 when result_len <= 1,
 *         in which case result_buf is left untouched
 * @author veeve
 */
size_t hp_get_entry_name(hp_entry_t  *entry,
                         char        *result_buf,
                         size_t       result_len) {
  /* A buffer of 0 or 1 bytes cannot hold any part of the name. */
  if (result_len <= 1) {
    return 0;
  }

  /* NOTE: snprintf's return value is compiler dependent, so the length is
   * measured with strlen() below instead. */
  if (entry->rlvl_hprof == 0) {
    snprintf(result_buf, result_len, "%s", entry->name_hprof);
  } else {
    /* Recursive invocation: append '@recurse_level'. */
    snprintf(result_buf, result_len, "%s@%d",
             entry->name_hprof, entry->rlvl_hprof);
  }

  /* Guarantee termination even if snprintf did not provide it. */
  result_buf[result_len - 1] = '\0';

  return strlen(result_buf);
}
/**
 * Decide whether a function is on the ignore list.
 *
 * The bit-vector filter is consulted first; only when the hash collides with
 * an ignored name is the name compared exactly against every list entry.
 * The caller must ensure the ignore list is non-NULL.
 *
 * @param  hash_code  8-bit hash of curr_func
 * @param  curr_func  name of the function being checked
 * @return 1 when the function is to be ignored, 0 otherwise
 * @author mpal
 */
int hp_ignore_entry_work(uint8 hash_code, char *curr_func) {
  char **candidate;

  /* No filter hit means the name cannot be in the list. */
  if (!hp_ignored_functions_filter_collision(hash_code)) {
    return 0;
  }

  for (candidate = hp_globals.ignored_function_names;
       *candidate != NULL;
       candidate++) {
    if (strcmp(curr_func, *candidate) == 0) {
      return 1;
    }
  }

  /* The filter hit was only a hash collision. */
  return 0;
}
/**
 * Cheap front door for the ignore check: answers 0 right away when no ignore
 * list is installed, otherwise defers to hp_ignore_entry_work().
 *
 * @return 1 when curr_func is to be ignored, 0 otherwise
 */
static inline int hp_ignore_entry(uint8 hash_code, char *curr_func) {
  /* First check if ignoring functions is enabled */
  if (hp_globals.ignored_function_names == NULL) {
    return 0;
  }

  return hp_ignore_entry_work(hash_code, curr_func) != 0;
}
/**
 * Build a caller qualified name for a callee.
 *
 * For example, if A() is caller for B(), then it returns "A==>B".
 * Recursive invocations are denoted with @<n> where n is the recursion
 * depth.
 *
 * For example, "foo==>foo@1", and "foo@2==>foo@3" are examples of direct
 * recursion. And "bar==>foo@1" is an example of an indirect recursive
 * call to foo (implying the foo() is on the call stack some levels
 * above).
 *
 * @param  entry       innermost entry (the callee)
 * @param  level       maximum number of stack levels to include
 * @param  result_buf  buffer receiving the NUL-terminated name
 * @param  result_len  size of result_buf in bytes
 * @return number of characters written to result_buf (excluding the NUL);
 *         the name is cut short when the buffer is too small
 *
 * @author kannan, veeve
 */
size_t hp_get_function_stack(hp_entry_t *entry,
                             int         level,
                             char       *result_buf,
                             size_t      result_len) {
  size_t len = 0;

  /* End recursion if we dont need deeper levels or we dont have any deeper
   * levels */
  if (!entry->prev_hprof || (level <= 1)) {
    return hp_get_entry_name(entry, result_buf, result_len);
  }

  /* Take care of all ancestors first */
  len = hp_get_function_stack(entry->prev_hprof,
                              level - 1,
                              result_buf,
                              result_len);

  /* Append the delimiter */
# define HP_STACK_DELIM        "==>"
# define HP_STACK_DELIM_LEN    (sizeof(HP_STACK_DELIM) - 1)

  if (result_len < (len + HP_STACK_DELIM_LEN)) {
    /* Insufficient result_buf. Bail out! */
    return len;
  }

  /* Add delimiter only if entry had ancestors */
  if (len) {
    /* The delimiter needs HP_STACK_DELIM_LEN bytes plus one for the
     * terminating NUL. With exactly HP_STACK_DELIM_LEN bytes left the NUL
     * would land one byte past the end of result_buf, so stop here. */
    if ((result_len - len) <= HP_STACK_DELIM_LEN) {
      return len;
    }

    /* result_buf[len] is the current terminator; overwrite it with the
     * delimiter and its own terminator. */
    memcpy(result_buf + len, HP_STACK_DELIM, HP_STACK_DELIM_LEN + 1);
    len += HP_STACK_DELIM_LEN;
  }

# undef HP_STACK_DELIM_LEN
# undef HP_STACK_DELIM

  /* Append the current function name */
  return len + hp_get_entry_name(entry,
                                 result_buf + len,
                                 result_len - len);
}
/**
 * Takes an input of the form /a/b/c/d/foo.php and returns
 * a pointer to one-level directory and basefile name
 * (d/foo.php) in the same string.
 *
 * @param  filename  NUL-terminated path, or NULL
 * @return pointer just past the second-to-last '/' of filename; filename
 *         itself when it contains fewer than two '/' characters; "" when
 *         filename is NULL
 */
static const char *hp_get_base_filename(const char *filename) {
  size_t pos;
  int    slashes = 0;

  if (!filename) {
    return "";
  }

  /* Scan backwards for the second "/" and return a ptr to the char after it.
   * An index is used instead of a moving pointer so that nothing is ever
   * formed that points before the start of the string (also for ""). */
  for (pos = strlen(filename); pos > 0; pos--) {
    if (filename[pos - 1] == '/' && ++slashes == 2) {
      return filename + pos;
    }
  }

  /* fewer than two "/" chars found, so return the whole string */
  return filename;
}
/**
* Get the name of the current function. The name is qualified with
* the class name if the function is in a class.
*
* @author kannan, hzhao
*/
static char *hp_get_function_name(zend_op_array *ops TSRMLS_DC) {
zend_execute_data *data;
const char *func = NULL;
const char *cls = NULL;
char *ret = NULL;
int len;
zend_function *curr_func;
data = EG(current_execute_data);
if (data) {
/* shared meta data for function on the call stack */
curr_func = data->function_state.function;
/* extract function name from the meta info */
func = curr_func->common.function_name;
if (func) {
/* previously, the order of the tests in the "if" below was
* flipped, leading to incorrect function names in profiler
* reports. When a method in a super-type is invoked the
* profiler should qualify the function name with the super-type
* class name (not the class name based on the run-time type
* of the object.
*/
if (curr_func->common.scope) {
cls = curr_func->common.scope->name;
} else if (data->object) {
cls = Z_OBJCE(*data->object)->name;
}
if (cls) {
len = strlen(cls) + strlen(func) + 10;
ret = (char*)emalloc(len);
snprintf(ret, len, "%s::%s", cls, func);
} else {
ret = estrdup(func);
}
} else {
long curr_op;
int add_filename = 0;
/* we are dealing with a special directive/function like
* include, eval, etc.
*/
#if ZEND_EXTENSION_API_NO >= 220121212
if (data->prev_execute_data) {
curr_op = data->prev_execute_data->opline->extended_value;
} else {
curr_op = data->opline->extended_value;
}
#elif ZEND_EXTENSION_API_NO >= 220100525
curr_op = data->opline->extended_value;
#else
curr_op = data->opline->op2.u.constant.value.lval;
#endif
switch (curr_op) {
case ZEND_EVAL:
func = "eval";
break;
case ZEND_INCLUDE:
func = "include";
add_filename = 1;
break;
case ZEND_REQUIRE:
func = "require";
add_filename = 1;
break;
case ZEND_INCLUDE_ONCE:
func = "include_once";
add_filename = 1;
break;
case ZEND_REQUIRE_ONCE:
func = "require_once";
add_filename = 1;
break;