For posterity, here are the results on the Atom N450 running in 32-bit mode:

#############################################################################
# With assembly file mpn/x86/k7/sqr_basecase.asm
#############################################################################
./speed -s 1-100 -t 1 mpn_sqr_basecase >> atom.tune
overhead 0.000000005 secs, precision 1000000 units of 6.00e-10 secs, CPU freq 1667.00 MHz
        mpn_sqr_basecase
1         0.000000013
2         0.000000029
3         0.000000061
4         0.000000117
5         0.000000173
6         0.000000248
7         0.000000320
8         0.000000400
9         0.000000485
10        0.000000578
11        0.000000677
12        0.000000782
13        0.000000906
14        0.000001023
15        0.000001171
16        0.000001302
17        0.000001441
18        0.000001594
19        0.000001747
20        0.000001906
21        0.000002071
22        0.000002242
23        0.000002421
24        0.000002605
25        0.000002797
26        0.000002995
27        0.000003199
28        0.000003411
29        0.000003629
30        0.000003854
31        0.000004087
32        0.000004326
33        0.000004570
34        0.000004821
35        0.000005079
36        0.000005343
37        0.000005613
38        0.000005891
39        0.000006174
40        0.000006465
41        0.000006762
42        0.000007065
43        0.000007376
44        0.000007692
45        0.000008017
46        0.000008347
47        0.000008686
48        0.000009030
49        0.000009380
50        0.000009737
zsh: segmentation fault (core dumped)  ./speed -s 1-100 -t 1 mpn_sqr_basecase

make tune
./tuneup
Parameters for ./mpn/x86/k7/gmp-mparam.h
Using: CPU cycle counter, supplemented by microsecond getrusage()
speed_precision 1000000, speed_unittime 1.00e-09 secs, CPU freq 1000.00 MHz
DEFAULT_MAX_SIZE 1000, fft_max_size 50000

/* Generated by tuneup.c, 2014-02-17, gcc 4.7 */

#define MUL_KARATSUBA_THRESHOLD          20
#define MUL_TOOM3_THRESHOLD             114
#define MUL_TOOM4_THRESHOLD             184
#define MUL_TOOM8H_THRESHOLD            286

#define SQR_BASECASE_THRESHOLD            0  /* always (native) */
#define SQR_KARATSUBA_THRESHOLD          36
#define SQR_TOOM3_THRESHOLD             117
#define SQR_TOOM4_THRESHOLD             298
#define SQR_TOOM8_THRESHOLD             324

#define POWM_THRESHOLD                  128

#define HGCD_THRESHOLD                  179
#define GCD_DC_THRESHOLD                442
#define GCDEXT_DC_THRESHOLD             309
#define JACOBI_BASE_METHOD                1

#define USE_PREINV_DIVREM_1               1  /* native */
#define USE_PREINV_MOD_1                  1  /* native */
#define DIVREM_2_THRESHOLD                0  /* always */
#define DIVEXACT_1_THRESHOLD              0  /* always (native) */
#define MODEXACT_1_ODD_THRESHOLD          0  /* always (native) */
#define MOD_1_1_THRESHOLD                83
#define MOD_1_2_THRESHOLD               195
#define MOD_1_3_THRESHOLD               502
#define DIVREM_HENSEL_QR_1_THRESHOLD     74
#define RSH_DIVREM_HENSEL_QR_1_THRESHOLD    987
#define DIVREM_EUCLID_HENSEL_THRESHOLD     58

#define ROOTREM_THRESHOLD                 6

#define GET_STR_DC_THRESHOLD             13
#define GET_STR_PRECOMPUTE_THRESHOLD     25
#define SET_STR_DC_THRESHOLD            208
#define SET_STR_PRECOMPUTE_THRESHOLD    272

#define MUL_FFT_FULL_THRESHOLD         3648

#define SQR_FFT_FULL_THRESHOLD         3008

#define MULLOW_BASECASE_THRESHOLD         4
#define MULLOW_DC_THRESHOLD              39
#define MULLOW_MUL_THRESHOLD           2966

#define MULHIGH_BASECASE_THRESHOLD        8
#define MULHIGH_DC_THRESHOLD             39
#define MULHIGH_MUL_THRESHOLD          2908

#define MULMOD_2EXPM1_THRESHOLD          20

#define FAC_UI_THRESHOLD               2849
#define DC_DIV_QR_THRESHOLD              68
#define DC_DIVAPPR_Q_N_THRESHOLD         22
#define INV_DIV_QR_THRESHOLD           2130
#define INV_DIVAPPR_Q_N_THRESHOLD        22
#define DC_DIV_Q_THRESHOLD              225
#define INV_DIV_Q_THRESHOLD            2747
#define DC_DIVAPPR_Q_THRESHOLD          217
#define INV_DIVAPPR_Q_THRESHOLD        7910
#define DC_BDIV_QR_THRESHOLD             68
#define DC_BDIV_Q_THRESHOLD             128

/* fft_tuning -- autogenerated by tune-fft */

#define FFT_TAB \
   { { 3, 3 }, { 3, 2 }, { 2, 1 }, { 1, 0 }, { 1, 0 } }

#define MULMOD_TAB \
   { 4, 3, 3, 3, 3, 2, 2, 2, 2, 2, 2, 2, 2, 1, 1 }

#define FFT_N_NUM 15

#define FFT_MULMOD_2EXPP1_CUTOFF 128


/* Tuneup completed successfully, took 794 seconds */

#############################################################################
# Without assembly file mpn/x86/k7/sqr_basecase.asm
#############################################################################
overhead 0.000000008 secs, precision 1000000 units of 1.00e-09 secs, CPU freq 1000.00 MHz
        mpn_sqr_basecase
1         0.000000022
2         0.000000054
3         0.000000136
4         0.000000211
5         0.000000301
6         0.000000407
7         0.000000529
8         0.000000667
9         0.000000850
10        0.000001019
11        0.000001222
12        0.000001438
13        0.000001670
14        0.000002148
15        0.000002227
16        0.000002524
17        0.000002843
18        0.000003155
19        0.000003483
20        0.000003827
21        0.000004187
22        0.000004563
23        0.000004955
24        0.000005363
25        0.000005787
26        0.000006228
27        0.000006684
28        0.000007156
29        0.000007644
30        0.000008148
31        0.000008668
32        0.000009205
33        0.000009757
34        0.000010325
35        0.000010909
36        0.000011509
37        0.000012125
38        0.000012757
39        0.000013405
40        0.000014069
41        0.000014750
42        0.000015446
43        0.000016158
44        0.000016886
45        0.000017631
46        0.000018391
47        0.000019167
48        0.000019959
49        0.000020767
50        0.000021592
51        0.000022432
52        0.000023289
53        0.000024160
54        0.000025048
55        0.000025953
56        0.000026873
57        0.000027809
58        0.000028762
59        0.000029729
60        0.000030713
61        0.000031715
62        0.000032730
63        0.000033763
64        0.000034810
65        0.000035876
66        0.000036955
67        0.000038051
68        0.000039163
69        0.000040292
70        0.000041436
71        0.000042596
72        0.000043772
73        0.000044966
74        0.000046173
75        0.000047397
76        0.000048639
77        0.000049894
78        0.000051166
79        0.000052456
80        0.000053760
81        0.000055080
82        0.000056415
83        0.000057768
84        0.000059137
85        0.000060522
86        0.000061922
87        0.000063338
88        0.000064771
89        0.000066218
90        0.000067682
91        0.000069163
92        0.000070659
93        0.000072172
94        0.000073703
95        0.000075246
96        0.000076805
97        0.000078381
98        0.000079974
99        0.000081581
100       0.000083205

-- 
You received this message because you are subscribed to the Google Groups 
"mpir-devel" group.
To unsubscribe from this group and stop receiving emails from it, send an email 
to mpir-devel+unsubscr...@googlegroups.com.
To post to this group, send email to mpir-devel@googlegroups.com.
Visit this group at http://groups.google.com/group/mpir-devel.
For more options, visit https://groups.google.com/groups/opt_out.

Reply via email to