1+ {
2+ "timestamp" : " 2025-10-20T02:48:59.372463" ,
3+ "device_info" : {
4+ "platform" : " Linux" ,
5+ "device" : " cuda" ,
6+ "ram_gb" : 22.89 ,
7+ "processor" : " Intel(R) Core(TM) Ultra 9 185H (16)" ,
8+ "gpu_name" : " NVIDIA GeForce RTX 4060 Laptop GPU" ,
9+ "gpu_memory_gb" : 7.62 ,
10+ "host" : " ASUSTeK COMPUTER INC. ASUS Vivobook Pro 15 N6506MV_N6506MV 1.0" ,
11+ "cuda_version" : " 12.8"
12+ },
13+ "tasks" : [
14+ {
15+ "task" : " embeddings" ,
16+ "dataset_size" : 100 ,
17+ "models" : {
18+ "thenlper/gte-large" : {
19+ "model_name" : " thenlper/gte-large" ,
20+ "batch_size" : 16 ,
21+ "max_seq_length" : 512 ,
22+ "embedding_dimension" : 1024 ,
23+ "device" : " cuda:0" ,
24+ "dtype" : " torch.float32" ,
25+ "actual_dataset_size" : 100 ,
26+ "num_runs" : 3 ,
27+ "runs" : [
28+ {
29+ "run" : 1 ,
30+ "encoding_time_seconds" : 3.91 ,
31+ "rows_per_second" : 25.57
32+ },
33+ {
34+ "run" : 2 ,
35+ "encoding_time_seconds" : 3.86 ,
36+ "rows_per_second" : 25.89
37+ },
38+ {
39+ "run" : 3 ,
40+ "encoding_time_seconds" : 3.95 ,
41+ "rows_per_second" : 25.3
42+ }
43+ ],
44+ "median_encoding_time_seconds" : 3.91 ,
45+ "median_rows_per_second" : 25.57
46+ },
47+ "nomic-ai/modernbert-embed-base" : {
48+ "model_name" : " nomic-ai/modernbert-embed-base" ,
49+ "batch_size" : 16 ,
50+ "max_seq_length" : 8192 ,
51+ "embedding_dimension" : 768 ,
52+ "device" : " cuda:0" ,
53+ "dtype" : " torch.float32" ,
54+ "actual_dataset_size" : 100 ,
55+ "num_runs" : 3 ,
56+ "runs" : [
57+ {
58+ "run" : 1 ,
59+ "encoding_time_seconds" : 2.72 ,
60+ "rows_per_second" : 36.78
61+ },
62+ {
63+ "run" : 2 ,
64+ "encoding_time_seconds" : 2.76 ,
65+ "rows_per_second" : 36.24
66+ },
67+ {
68+ "run" : 3 ,
69+ "encoding_time_seconds" : 2.79 ,
70+ "rows_per_second" : 35.9
71+ }
72+ ],
73+ "median_encoding_time_seconds" : 2.76 ,
74+ "median_rows_per_second" : 36.24
75+ }
76+ },
77+ "task_score" : 539.7301
78+ },
79+ {
80+ "task" : " llms" ,
81+ "dataset" : " awesome-chatgpt-prompts" ,
82+ "num_prompts" : 3 ,
83+ "model" : {
84+ "model_name" : " gpt-oss-20b" ,
85+ "num_prompts" : 3 ,
86+ "num_runs" : 3 ,
87+ "runs" : [
88+ {
89+ "run" : 1 ,
90+ "median_latency_s" : 123.0658 ,
91+ "median_ttft_s" : 21.2746 ,
92+ "median_tokens_per_sec" : 15.3862 ,
93+ "total_input_tokens" : 561 ,
94+ "total_output_tokens" : 3443
95+ },
96+ {
97+ "run" : 2 ,
98+ "median_latency_s" : 136.2836 ,
99+ "median_ttft_s" : 27.8911 ,
100+ "median_tokens_per_sec" : 16.7172 ,
101+ "total_input_tokens" : 561 ,
102+ "total_output_tokens" : 3625
103+ },
104+ {
105+ "run" : 3 ,
106+ "median_latency_s" : 136.6311 ,
107+ "median_ttft_s" : 27.8711 ,
108+ "median_tokens_per_sec" : 16.7022 ,
109+ "total_input_tokens" : 561 ,
110+ "total_output_tokens" : 3625
111+ }
112+ ],
113+ "final_median_latency_s" : 136.2836 ,
114+ "final_median_ttft_s" : 27.8711 ,
115+ "final_median_tokens_per_sec" : 16.7022
116+ },
117+ "task_score" : 26.4155
118+ }
119+ ]
120+ }
0 commit comments