chore(reports): Phase 1/2 baseline + 2026-04~05 평가·관측 자료 보존
Phase 1.1a~1.3 / Phase 2.1~2.3 평가셋 측정 결과 + regression baseline + D9 STT 후속 VRAM 피크 관측 데이터. project_search_v2 메모리에 Phase 2 평가셋 v0.2 baseline용 보존 명시.
This commit is contained in:
@@ -0,0 +1,24 @@
|
||||
label,id,category,intent,domain_hint,query,relevant_ids,returned_ids_top10,latency_ms,recall_at_10,mrr_at_10,ndcg_at_10,top3_hit,error
|
||||
single,kw_001,exact_keyword,fact_lookup,document,산업안전보건법 제6장,3856;3868;3879,3856;3851;3876;3862;3853;3861;3879;3868;3873;3871,183.6,1.000,1.000,0.774,1,
|
||||
single,kw_002,exact_keyword,fact_lookup,document,중대재해 처벌 등에 관한 법률 제2장 중대산업재해,3917;3921,3921;3923;3917;3922;3918;3920;3919;3916;3874;3854,172.2,1.000,1.000,0.920,1,
|
||||
single,kw_003,exact_keyword,fact_lookup,document,화학물질관리법 유해화학물질 영업자,3981,3981;3980;3985;3978;3983;3979;3857;3880;3903;3984,151.1,1.000,1.000,1.000,1,
|
||||
single,kw_004,exact_keyword,fact_lookup,document,근로기준법 안전과 보건,4041,4041;3851;4042;3852;4044;3905;4043;3877;4040;3875,140.1,1.000,1.000,1.000,1,
|
||||
single,kw_005,exact_keyword,fact_lookup,document,산업안전보건기준에 관한 규칙 보호구,3888,3897;3890;3901;3910;3888;3898;3885;3892;3891;3887,162.0,1.000,0.200,0.387,0,
|
||||
single,nl_001,natural_language_ko,semantic_search,document,기계로 인한 산업재해 관련 법령,3856;3868;3879;3854,3897;3878;3851;3856;3868;3895;3879;3863;3874;3855,132.3,0.750,0.250,0.449,0,
|
||||
single,nl_002,natural_language_ko,semantic_search,document,사업주가 도급을 줄 때 산업재해를 예방하기 위해 해야 할 일,3855;3867;3878,3855;3917;3867;3854;3896;3895;3851;3903;3908;3897,151.4,0.667,1.000,0.704,1,
|
||||
single,nl_003,natural_language_ko,semantic_search,document,유해화학물질을 다루는 회사가 지켜야 할 안전 의무,3980;3981;3982,3980;3855;3985;3760;3910;3904;3757;3896;3903;3909,134.3,0.333,1.000,0.469,1,
|
||||
single,nl_004,natural_language_ko,semantic_search,document,중대재해가 발생했을 때 경영책임자가 처벌받는 기준,3916;3917;3920;3921,3917;3918;3854;3877;3872;3984;3916;3919;3867;3922,136.5,0.500,1.000,0.521,1,
|
||||
single,nl_005,natural_language_ko,semantic_search,document,안전보건교육은 누가 받아야 하고 어떤 내용을 다루는가,3853;3865,3853;4025;3876;3757;3787;3811;3778;3810;3818;3880,148.4,0.500,1.000,0.613,1,
|
||||
single,cl_001,crosslingual_ko_en,semantic_search,document,기계 안전 가드 설계 원리,3770;3856,3770;4540;3817;4548;3758;3791;3774;3789;3787;3773,135.2,0.500,1.000,0.613,1,
|
||||
single,cl_002,crosslingual_ko_en,semantic_search,document,산업 안전 입문서,3755;3775;3776;3777,3819;3755;3807;3802;3815;3817;3774;3775;3810;3800,134.7,0.500,0.500,0.369,1,
|
||||
single,cl_003,crosslingual_ko_en,semantic_search,document,전기 안전 위험,3772;3790,3790;3897;3775;3772;3755;3771;3769;3774;3766;3799,148.2,1.000,1.000,0.877,1,
|
||||
single,news_001,news_ko,semantic_search,news,이란과 미국의 군사 충돌,4303;4304;4307;4316;4322;4323;4327;4335,4317;4452;4329;4321;4307;4339;4331;4744;4642;4743,129.8,0.125,0.200,0.098,1,
|
||||
single,news_002,news_ko,semantic_search,news,호르무즈 해협 봉쇄,4316;4320;4322;4327,4346;4320;4767;4349;4762;4322;4340;4759;4304;4642,126.3,0.500,0.500,0.385,0,
|
||||
single,news_003,news_en,semantic_search,news,Trump Iran ultimatum,4258;4260;4262,4776;4775;4679;4519;4258;4199;4670;4202;4668;4515,125.1,0.333,0.200,0.182,1,
|
||||
single,news_004,news_fr,semantic_search,news,guerre en Iran,4199;4202;4210;4361;4363;4507;4519;4521,4776;4199;4507;4519;4688;4211;4678;4258;4363;4691,129.4,0.500,0.500,0.471,1,
|
||||
single,news_005,news_crosslingual,semantic_search,news,이란 미국 전쟁 글로벌 반응,4202;4258;4262;4536;4303;4304;4316,4457;4307;4452;4765;4329;4345;4324;4443;4761;4444,133.6,0.000,0.000,0.000,1,
|
||||
single,misc_001,other_domain,fact_lookup,document,강체의 평면 운동학,4063;4065,4063;4071;4064;4065;4066;4058;4067;4069;4068;4062,205.9,1.000,1.000,0.877,1,
|
||||
single,misc_002,other_domain,semantic_search,document,질점의 운동역학,4060;4061;4062,4062;4060;4061;4070;4058;4059;4064;4068;4066;4065,263.6,1.000,1.000,1.000,1,
|
||||
single,fail_001,failure_expected,semantic_search,document,Rust async runtime tokio scheduler 내부 구조,,3810;4547;4546;3774;4540;3812;4069;3819;3787;4062,139.1,0.000,0.000,0.000,1,
|
||||
single,fail_002,failure_expected,semantic_search,document,양자컴퓨터 큐비트 디코히어런스,,3817;3795;3856;4068;4064;4539;4058;3800;3904;4057,129.4,0.000,0.000,0.000,1,
|
||||
single,fail_003,failure_expected,semantic_search,news,재즈 보컬리스트 빌리 홀리데이,,4634;4675;4697;4205;4289;4281;4116;4100;4057;3757,126.5,0.000,0.000,0.000,1,
|
||||
|
Reference in New Issue
Block a user