Spaces:
				
			
			
	
			
			
					
		Running
		
	
	
	
			
			
	
	
	
	
		
		
					
		Running
		
	
		mehran
		
	committed on
		
		
					Commit 
							
							·
						
						7d9ae8d
	
1
								Parent(s):
							
							3e59826
								
add gpt 5 and oss and llama4 scout
Browse files
- leaderboard/boards_data/MMLU.jsonl +5 -0
- leaderboard/boards_data/all.jsonl +5 -0
- leaderboard/boards_data/extractive-qa_PQuAD.jsonl +5 -0
- leaderboard/boards_data/ifeval.jsonl +6 -1
- leaderboard/boards_data/keyword-extraction_SynKeywords.jsonl +5 -0
- leaderboard/boards_data/mt_bench.jsonl +5 -0
- leaderboard/boards_data/ner_arman.jsonl +5 -0
- leaderboard/boards_data/nli_farstail.jsonl +5 -0
- leaderboard/boards_data/paraphrase-detection_FarsiParaphraseDetection.jsonl +5 -0
- leaderboard/boards_data/paraphrase-detection_parsinlu.jsonl +5 -0
- leaderboard/boards_data/persian_csr.jsonl +5 -0
- leaderboard/boards_data/persian_nlg.jsonl +5 -0
- leaderboard/boards_data/persian_nlu.jsonl +0 -0
- leaderboard/boards_data/question-generation_PersianQA.jsonl +5 -0
- leaderboard/boards_data/sentiment-analysis_deepsentipers.jsonl +5 -0
- leaderboard/boards_data/sts_FarSICK.jsonl +5 -0
- leaderboard/boards_data/sts_SynPerSTS.jsonl +5 -0
- leaderboard/boards_data/summarization_PnSummary.jsonl +5 -0
- leaderboard/boards_data/summarization_SamSUM-fa.jsonl +5 -0
- leaderboard/boards_data/tone-classification_SynTone.jsonl +5 -0
- leaderboard/boards_data/topic-classification_sid.jsonl +5 -0
- leaderboard/boards_data/translation-ar2fa_ar2fa.jsonl +5 -0
- leaderboard/boards_data/translation-en2fa_en2fa.jsonl +5 -0
- leaderboard/boards_data/translation-fa2ar_fa2ar.jsonl +5 -0
- leaderboard/boards_data/translation-fa2en_fa2en.jsonl +5 -0
- leaderboard/leaderboard_config.yaml +25 -0
    	
        leaderboard/boards_data/MMLU.jsonl
    CHANGED
    
    | @@ -1,17 +1,22 @@ | |
| 1 | 
             
            {"Model Name":"gemini-2.5-pro","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8401114206,"cinema_acc":0.9375,"emergency_number_acc":0.8,"foods_acc":0.8,"games_acc":0.55,"herbal_drugs_acc":0.75,"places_acc":0.8857142857,"poetry_acc":0.9,"politicians_acc":0.95,"popular_people_acc":0.9282051282,"Government_law_acc":0.9782608696,"proverbs_acc":0.9,"religous_acc":0.9777777778,"social_manners_acc":0.9438202247,"souvenirs_acc":0.78,"sports_acc":0.6507936508,"GPK_acc":0.8733798604,"SPK_acc":0.856476498,"UPK_acc":0.824103816}
         | 
| 2 | 
             
            {"Model Name":"o3","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8217442751,"cinema_acc":0.8125,"emergency_number_acc":1.0,"foods_acc":0.77,"games_acc":0.75,"herbal_drugs_acc":0.65,"places_acc":0.8952380952,"poetry_acc":0.875,"politicians_acc":1.0,"popular_people_acc":0.9179487179,"Government_law_acc":0.8913043478,"proverbs_acc":0.89,"religous_acc":0.9555555556,"social_manners_acc":0.8876404494,"souvenirs_acc":0.78,"sports_acc":0.5714285714,"GPK_acc":0.8454636092,"SPK_acc":0.833781603,"UPK_acc":0.8100680622}
         | 
|  | |
| 3 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7274624374,"cinema_acc":0.8875,"emergency_number_acc":0.8,"foods_acc":0.82,"games_acc":0.4,"herbal_drugs_acc":0.75,"places_acc":0.8952380952,"poetry_acc":0.9,"politicians_acc":0.9,"popular_people_acc":0.8564102564,"Government_law_acc":0.9565217391,"proverbs_acc":0.87,"religous_acc":0.9555555556,"social_manners_acc":0.9101123596,"souvenirs_acc":0.72,"sports_acc":0.5873015873,"GPK_acc":0.8394815553,"SPK_acc":0.7645583229,"UPK_acc":0.686473306}
         | 
| 4 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7214996174,"cinema_acc":0.6875,"emergency_number_acc":0.7,"foods_acc":0.74,"games_acc":0.5,"herbal_drugs_acc":0.675,"places_acc":0.8476190476,"poetry_acc":0.8,"politicians_acc":0.95,"popular_people_acc":0.8615384615,"Government_law_acc":0.8913043478,"proverbs_acc":0.77,"religous_acc":0.9333333333,"social_manners_acc":0.9101123596,"souvenirs_acc":0.72,"sports_acc":0.6031746032,"GPK_acc":0.7936191426,"SPK_acc":0.7588245834,"UPK_acc":0.6854869755}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7040411769,"cinema_acc":0.7625,"emergency_number_acc":0.9,"foods_acc":0.78,"games_acc":0.7,"herbal_drugs_acc":0.625,"places_acc":0.8666666667,"poetry_acc":0.875,"politicians_acc":0.85,"popular_people_acc":0.8461538462,"Government_law_acc":0.8913043478,"proverbs_acc":0.86,"religous_acc":0.8888888889,"social_manners_acc":0.8651685393,"souvenirs_acc":0.68,"sports_acc":0.4761904762,"GPK_acc":0.8005982054,"SPK_acc":0.7258555814,"UPK_acc":0.6759912742}
         | 
| 6 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.6957640676,"cinema_acc":0.725,"emergency_number_acc":0.6,"foods_acc":0.79,"games_acc":0.5,"herbal_drugs_acc":0.75,"places_acc":0.8380952381,"poetry_acc":0.825,"politicians_acc":0.75,"popular_people_acc":0.7846153846,"Government_law_acc":0.9565217391,"proverbs_acc":0.78,"religous_acc":0.9111111111,"social_manners_acc":0.8539325843,"souvenirs_acc":0.74,"sports_acc":0.4761904762,"GPK_acc":0.7756729811,"SPK_acc":0.7263931195,"UPK_acc":0.6635442063}
         | 
| 7 | 
             
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.6884607359,"cinema_acc":0.75,"emergency_number_acc":0.7,"foods_acc":0.78,"games_acc":0.6,"herbal_drugs_acc":0.7,"places_acc":0.8380952381,"poetry_acc":0.9,"politicians_acc":0.95,"popular_people_acc":0.8615384615,"Government_law_acc":0.9347826087,"proverbs_acc":0.8,"religous_acc":0.9333333333,"social_manners_acc":0.8426966292,"souvenirs_acc":0.66,"sports_acc":0.5555555556,"GPK_acc":0.8015952144,"SPK_acc":0.720121842,"UPK_acc":0.6512254587}
         | 
|  | |
| 8 | 
             
            {"Model Name":"deepseek-reasoner","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","acc":0.6810513107,"cinema_acc":0.5125,"emergency_number_acc":0.5,"foods_acc":0.63,"games_acc":0.55,"herbal_drugs_acc":0.65,"places_acc":0.8666666667,"poetry_acc":0.55,"politicians_acc":0.8,"popular_people_acc":0.7435897436,"Government_law_acc":0.9347826087,"proverbs_acc":0.81,"religous_acc":0.9111111111,"social_manners_acc":0.8764044944,"souvenirs_acc":0.72,"sports_acc":0.5079365079,"GPK_acc":0.7288135593,"SPK_acc":0.7400865177,"UPK_acc":0.6328756576}
         | 
|  | |
| 9 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.6466578563,"cinema_acc":0.7125,"emergency_number_acc":0.6,"foods_acc":0.72,"games_acc":0.5,"herbal_drugs_acc":0.7,"places_acc":0.8666666667,"poetry_acc":0.8,"politicians_acc":0.8,"popular_people_acc":0.7743589744,"Government_law_acc":0.9347826087,"proverbs_acc":0.77,"religous_acc":0.9111111111,"social_manners_acc":0.8539325843,"souvenirs_acc":0.68,"sports_acc":0.5873015873,"GPK_acc":0.7686939182,"SPK_acc":0.6764020785,"UPK_acc":0.6096496856}
         | 
| 10 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.6128538638,"cinema_acc":0.525,"emergency_number_acc":0.7,"foods_acc":0.73,"games_acc":0.55,"herbal_drugs_acc":0.625,"places_acc":0.8380952381,"poetry_acc":0.575,"politicians_acc":0.6,"popular_people_acc":0.7076923077,"Government_law_acc":0.847826087,"proverbs_acc":0.71,"religous_acc":0.6666666667,"social_manners_acc":0.8202247191,"souvenirs_acc":0.68,"sports_acc":0.4920634921,"GPK_acc":0.6949152542,"SPK_acc":0.6265902168,"UPK_acc":0.5924547671}
         | 
| 11 | 
             
            {"Model Name":"c4ai-command-a-03-2025","thinking_method":"β","model_url":"https_google.com","parameters_count":"111000000000","source_type":"Open-Source","acc":0.5980651448,"cinema_acc":0.6,"emergency_number_acc":0.5,"foods_acc":0.67,"games_acc":0.65,"herbal_drugs_acc":0.675,"places_acc":0.8476190476,"poetry_acc":0.775,"politicians_acc":0.95,"popular_people_acc":0.8092783505,"Government_law_acc":0.8913043478,"proverbs_acc":0.78,"religous_acc":0.8666666667,"social_manners_acc":0.8988764045,"souvenirs_acc":0.68,"sports_acc":0.5396825397,"GPK_acc":0.7604790419,"SPK_acc":0.6417428725,"UPK_acc":0.5458980614}
         | 
|  | |
| 12 | 
             
            {"Model Name":"deepseek-chat","thinking_method":"β","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","acc":0.5908047576,"cinema_acc":0.5875,"emergency_number_acc":0.4,"foods_acc":0.56,"games_acc":0.55,"herbal_drugs_acc":0.75,"places_acc":0.8285714286,"poetry_acc":0.75,"politicians_acc":0.7,"popular_people_acc":0.7794871795,"Government_law_acc":0.8695652174,"proverbs_acc":0.78,"religous_acc":0.8444444444,"social_manners_acc":0.808988764,"souvenirs_acc":0.74,"sports_acc":0.5555555556,"GPK_acc":0.7288135593,"SPK_acc":0.6348324673,"UPK_acc":0.541511613}
         | 
| 13 | 
             
            {"Model Name":"Llama-3.3-70B-Instruct","thinking_method":"β","model_url":"https_google.com","parameters_count":"70600000000","source_type":"Open-Source","acc":0.5714086374,"cinema_acc":0.5625,"emergency_number_acc":0.3,"foods_acc":0.56,"games_acc":0.6,"herbal_drugs_acc":0.575,"places_acc":0.8095238095,"poetry_acc":0.6,"politicians_acc":0.85,"popular_people_acc":0.7282051282,"Government_law_acc":0.8913043478,"proverbs_acc":0.7,"religous_acc":0.8222222222,"social_manners_acc":0.8539325843,"souvenirs_acc":0.6,"sports_acc":0.5555555556,"GPK_acc":0.6939182453,"SPK_acc":0.605489774,"UPK_acc":0.5310727179}
         | 
| 14 | 
             
            {"Model Name":"gpt-4o-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.56986854,"cinema_acc":0.6625,"emergency_number_acc":0.4,"foods_acc":0.71,"games_acc":0.45,"herbal_drugs_acc":0.675,"places_acc":0.7714285714,"poetry_acc":0.675,"politicians_acc":0.75,"popular_people_acc":0.6820512821,"Government_law_acc":0.8913043478,"proverbs_acc":0.75,"religous_acc":0.7777777778,"social_manners_acc":0.7865168539,"souvenirs_acc":0.68,"sports_acc":0.5555555556,"GPK_acc":0.7078763709,"SPK_acc":0.6075972048,"UPK_acc":0.5250866162}
         | 
|  | |
| 15 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","acc":0.5635086255,"cinema_acc":0.45,"emergency_number_acc":0.2,"foods_acc":0.49,"games_acc":0.45,"herbal_drugs_acc":0.45,"places_acc":0.6285714286,"poetry_acc":0.35,"politicians_acc":0.3,"popular_people_acc":0.4974358974,"Government_law_acc":0.7608695652,"proverbs_acc":0.64,"religous_acc":0.6888888889,"social_manners_acc":0.8202247191,"souvenirs_acc":0.56,"sports_acc":0.3968253968,"GPK_acc":0.5513459621,"SPK_acc":0.5967741935,"UPK_acc":0.5412549724}
         | 
| 16 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"27400000000","source_type":"Open-Source","acc":0.5633303193,"cinema_acc":0.625,"emergency_number_acc":0.4,"foods_acc":0.68,"games_acc":0.35,"herbal_drugs_acc":0.6,"places_acc":0.7904761905,"poetry_acc":0.7,"politicians_acc":0.75,"popular_people_acc":0.641025641,"Government_law_acc":0.8913043478,"proverbs_acc":0.74,"religous_acc":0.7777777778,"social_manners_acc":0.8764044944,"souvenirs_acc":0.62,"sports_acc":0.6031746032,"GPK_acc":0.6989032901,"SPK_acc":0.5977423401,"UPK_acc":0.5212370076}
         | 
| 17 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.5440356745,"cinema_acc":0.5263157895,"emergency_number_acc":0.4,"foods_acc":0.72,"games_acc":0.55,"herbal_drugs_acc":0.575,"places_acc":0.8095238095,"poetry_acc":0.625,"politicians_acc":0.75,"popular_people_acc":0.6717948718,"Government_law_acc":0.8043478261,"proverbs_acc":0.72,"religous_acc":0.8444444444,"social_manners_acc":0.8539325843,"souvenirs_acc":0.6,"sports_acc":0.4920634921,"GPK_acc":0.6906906907,"SPK_acc":0.5934420355,"UPK_acc":0.4897066392}
         | 
|  | |
| 1 | 
             
            {"Model Name":"gemini-2.5-pro","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8401114206,"cinema_acc":0.9375,"emergency_number_acc":0.8,"foods_acc":0.8,"games_acc":0.55,"herbal_drugs_acc":0.75,"places_acc":0.8857142857,"poetry_acc":0.9,"politicians_acc":0.95,"popular_people_acc":0.9282051282,"Government_law_acc":0.9782608696,"proverbs_acc":0.9,"religous_acc":0.9777777778,"social_manners_acc":0.9438202247,"souvenirs_acc":0.78,"sports_acc":0.6507936508,"GPK_acc":0.8733798604,"SPK_acc":0.856476498,"UPK_acc":0.824103816}
         | 
| 2 | 
             
            {"Model Name":"o3","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8217442751,"cinema_acc":0.8125,"emergency_number_acc":1.0,"foods_acc":0.77,"games_acc":0.75,"herbal_drugs_acc":0.65,"places_acc":0.8952380952,"poetry_acc":0.875,"politicians_acc":1.0,"popular_people_acc":0.9179487179,"Government_law_acc":0.8913043478,"proverbs_acc":0.89,"religous_acc":0.9555555556,"social_manners_acc":0.8876404494,"souvenirs_acc":0.78,"sports_acc":0.5714285714,"GPK_acc":0.8454636092,"SPK_acc":0.833781603,"UPK_acc":0.8100680622}
         | 
| 3 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7620504973,"cinema_acc":0.6375,"emergency_number_acc":0.6,"foods_acc":0.77,"games_acc":0.5,"herbal_drugs_acc":0.65,"places_acc":0.8857142857,"poetry_acc":0.65,"politicians_acc":0.8,"popular_people_acc":0.8153846154,"Government_law_acc":0.9347826087,"proverbs_acc":0.74,"religous_acc":0.8888888889,"social_manners_acc":0.8539325843,"souvenirs_acc":0.74,"sports_acc":0.5555555556,"GPK_acc":0.7666999003,"SPK_acc":0.7674251926,"UPK_acc":0.757602977}
         | 
| 4 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7274624374,"cinema_acc":0.8875,"emergency_number_acc":0.8,"foods_acc":0.82,"games_acc":0.4,"herbal_drugs_acc":0.75,"places_acc":0.8952380952,"poetry_acc":0.9,"politicians_acc":0.9,"popular_people_acc":0.8564102564,"Government_law_acc":0.9565217391,"proverbs_acc":0.87,"religous_acc":0.9555555556,"social_manners_acc":0.9101123596,"souvenirs_acc":0.72,"sports_acc":0.5873015873,"GPK_acc":0.8394815553,"SPK_acc":0.7645583229,"UPK_acc":0.686473306}
         | 
| 5 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7214996174,"cinema_acc":0.6875,"emergency_number_acc":0.7,"foods_acc":0.74,"games_acc":0.5,"herbal_drugs_acc":0.675,"places_acc":0.8476190476,"poetry_acc":0.8,"politicians_acc":0.95,"popular_people_acc":0.8615384615,"Government_law_acc":0.8913043478,"proverbs_acc":0.77,"religous_acc":0.9333333333,"social_manners_acc":0.9101123596,"souvenirs_acc":0.72,"sports_acc":0.6031746032,"GPK_acc":0.7936191426,"SPK_acc":0.7588245834,"UPK_acc":0.6854869755}
         | 
| 6 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7040411769,"cinema_acc":0.7625,"emergency_number_acc":0.9,"foods_acc":0.78,"games_acc":0.7,"herbal_drugs_acc":0.625,"places_acc":0.8666666667,"poetry_acc":0.875,"politicians_acc":0.85,"popular_people_acc":0.8461538462,"Government_law_acc":0.8913043478,"proverbs_acc":0.86,"religous_acc":0.8888888889,"social_manners_acc":0.8651685393,"souvenirs_acc":0.68,"sports_acc":0.4761904762,"GPK_acc":0.8005982054,"SPK_acc":0.7258555814,"UPK_acc":0.6759912742}
         | 
| 7 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.6957640676,"cinema_acc":0.725,"emergency_number_acc":0.6,"foods_acc":0.79,"games_acc":0.5,"herbal_drugs_acc":0.75,"places_acc":0.8380952381,"poetry_acc":0.825,"politicians_acc":0.75,"popular_people_acc":0.7846153846,"Government_law_acc":0.9565217391,"proverbs_acc":0.78,"religous_acc":0.9111111111,"social_manners_acc":0.8539325843,"souvenirs_acc":0.74,"sports_acc":0.4761904762,"GPK_acc":0.7756729811,"SPK_acc":0.7263931195,"UPK_acc":0.6635442063}
         | 
| 8 | 
             
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.6884607359,"cinema_acc":0.75,"emergency_number_acc":0.7,"foods_acc":0.78,"games_acc":0.6,"herbal_drugs_acc":0.7,"places_acc":0.8380952381,"poetry_acc":0.9,"politicians_acc":0.95,"popular_people_acc":0.8615384615,"Government_law_acc":0.9347826087,"proverbs_acc":0.8,"religous_acc":0.9333333333,"social_manners_acc":0.8426966292,"souvenirs_acc":0.66,"sports_acc":0.5555555556,"GPK_acc":0.8015952144,"SPK_acc":0.720121842,"UPK_acc":0.6512254587}
         | 
| 9 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.6864436252,"cinema_acc":0.5375,"emergency_number_acc":0.5,"foods_acc":0.72,"games_acc":0.5,"herbal_drugs_acc":0.7,"places_acc":0.8095238095,"poetry_acc":0.425,"politicians_acc":0.6,"popular_people_acc":0.7128205128,"Government_law_acc":0.9347826087,"proverbs_acc":0.69,"religous_acc":0.8222222222,"social_manners_acc":0.7415730337,"souvenirs_acc":0.68,"sports_acc":0.5873015873,"GPK_acc":0.6949152542,"SPK_acc":0.6867944813,"UPK_acc":0.6851020146}
         | 
| 10 | 
             
            {"Model Name":"deepseek-reasoner","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","acc":0.6810513107,"cinema_acc":0.5125,"emergency_number_acc":0.5,"foods_acc":0.63,"games_acc":0.55,"herbal_drugs_acc":0.65,"places_acc":0.8666666667,"poetry_acc":0.55,"politicians_acc":0.8,"popular_people_acc":0.7435897436,"Government_law_acc":0.9347826087,"proverbs_acc":0.81,"religous_acc":0.9111111111,"social_manners_acc":0.8764044944,"souvenirs_acc":0.72,"sports_acc":0.5079365079,"GPK_acc":0.7288135593,"SPK_acc":0.7400865177,"UPK_acc":0.6328756576}
         | 
| 11 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","acc":0.6772622939,"cinema_acc":0.475,"emergency_number_acc":0.4,"foods_acc":0.75,"games_acc":0.5,"herbal_drugs_acc":0.625,"places_acc":0.8,"poetry_acc":0.525,"politicians_acc":0.55,"popular_people_acc":0.6666666667,"Government_law_acc":0.8695652174,"proverbs_acc":0.53,"religous_acc":0.7555555556,"social_manners_acc":0.7640449438,"souvenirs_acc":0.6,"sports_acc":0.4761904762,"GPK_acc":0.6510468594,"SPK_acc":0.6792689482,"UPK_acc":0.6791992814}
         | 
| 12 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.6466578563,"cinema_acc":0.7125,"emergency_number_acc":0.6,"foods_acc":0.72,"games_acc":0.5,"herbal_drugs_acc":0.7,"places_acc":0.8666666667,"poetry_acc":0.8,"politicians_acc":0.8,"popular_people_acc":0.7743589744,"Government_law_acc":0.9347826087,"proverbs_acc":0.77,"religous_acc":0.9111111111,"social_manners_acc":0.8539325843,"souvenirs_acc":0.68,"sports_acc":0.5873015873,"GPK_acc":0.7686939182,"SPK_acc":0.6764020785,"UPK_acc":0.6096496856}
         | 
| 13 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.6128538638,"cinema_acc":0.525,"emergency_number_acc":0.7,"foods_acc":0.73,"games_acc":0.55,"herbal_drugs_acc":0.625,"places_acc":0.8380952381,"poetry_acc":0.575,"politicians_acc":0.6,"popular_people_acc":0.7076923077,"Government_law_acc":0.847826087,"proverbs_acc":0.71,"religous_acc":0.6666666667,"social_manners_acc":0.8202247191,"souvenirs_acc":0.68,"sports_acc":0.4920634921,"GPK_acc":0.6949152542,"SPK_acc":0.6265902168,"UPK_acc":0.5924547671}
         | 
| 14 | 
             
            {"Model Name":"c4ai-command-a-03-2025","thinking_method":"β","model_url":"https_google.com","parameters_count":"111000000000","source_type":"Open-Source","acc":0.5980651448,"cinema_acc":0.6,"emergency_number_acc":0.5,"foods_acc":0.67,"games_acc":0.65,"herbal_drugs_acc":0.675,"places_acc":0.8476190476,"poetry_acc":0.775,"politicians_acc":0.95,"popular_people_acc":0.8092783505,"Government_law_acc":0.8913043478,"proverbs_acc":0.78,"religous_acc":0.8666666667,"social_manners_acc":0.8988764045,"souvenirs_acc":0.68,"sports_acc":0.5396825397,"GPK_acc":0.7604790419,"SPK_acc":0.6417428725,"UPK_acc":0.5458980614}
         | 
| 15 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","acc":0.5958127565,"cinema_acc":0.45,"emergency_number_acc":0.2,"foods_acc":0.51,"games_acc":0.3,"herbal_drugs_acc":0.475,"places_acc":0.6761904762,"poetry_acc":0.425,"politicians_acc":0.25,"popular_people_acc":0.4923076923,"Government_law_acc":0.8260869565,"proverbs_acc":0.54,"religous_acc":0.6666666667,"social_manners_acc":0.7191011236,"souvenirs_acc":0.46,"sports_acc":0.3650793651,"GPK_acc":0.5333998006,"SPK_acc":0.5954130084,"UPK_acc":0.6041319133}
         | 
| 16 | 
             
            {"Model Name":"deepseek-chat","thinking_method":"β","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","acc":0.5908047576,"cinema_acc":0.5875,"emergency_number_acc":0.4,"foods_acc":0.56,"games_acc":0.55,"herbal_drugs_acc":0.75,"places_acc":0.8285714286,"poetry_acc":0.75,"politicians_acc":0.7,"popular_people_acc":0.7794871795,"Government_law_acc":0.8695652174,"proverbs_acc":0.78,"religous_acc":0.8444444444,"social_manners_acc":0.808988764,"souvenirs_acc":0.74,"sports_acc":0.5555555556,"GPK_acc":0.7288135593,"SPK_acc":0.6348324673,"UPK_acc":0.541511613}
         | 
| 17 | 
             
            {"Model Name":"Llama-3.3-70B-Instruct","thinking_method":"β","model_url":"https_google.com","parameters_count":"70600000000","source_type":"Open-Source","acc":0.5714086374,"cinema_acc":0.5625,"emergency_number_acc":0.3,"foods_acc":0.56,"games_acc":0.6,"herbal_drugs_acc":0.575,"places_acc":0.8095238095,"poetry_acc":0.6,"politicians_acc":0.85,"popular_people_acc":0.7282051282,"Government_law_acc":0.8913043478,"proverbs_acc":0.7,"religous_acc":0.8222222222,"social_manners_acc":0.8539325843,"souvenirs_acc":0.6,"sports_acc":0.5555555556,"GPK_acc":0.6939182453,"SPK_acc":0.605489774,"UPK_acc":0.5310727179}
         | 
| 18 | 
             
            {"Model Name":"gpt-4o-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.56986854,"cinema_acc":0.6625,"emergency_number_acc":0.4,"foods_acc":0.71,"games_acc":0.45,"herbal_drugs_acc":0.675,"places_acc":0.7714285714,"poetry_acc":0.675,"politicians_acc":0.75,"popular_people_acc":0.6820512821,"Government_law_acc":0.8913043478,"proverbs_acc":0.75,"religous_acc":0.7777777778,"social_manners_acc":0.7865168539,"souvenirs_acc":0.68,"sports_acc":0.5555555556,"GPK_acc":0.7078763709,"SPK_acc":0.6075972048,"UPK_acc":0.5250866162}
         | 
| 19 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https_google.com","parameters_count":"109000000000","source_type":"Open-Source","acc":0.5639563191,"cinema_acc":0.65,"emergency_number_acc":0.5,"foods_acc":0.64,"games_acc":0.55,"herbal_drugs_acc":0.625,"places_acc":0.819047619,"poetry_acc":0.725,"politicians_acc":0.85,"popular_people_acc":0.7487179487,"Government_law_acc":0.847826087,"proverbs_acc":0.73,"religous_acc":0.8666666667,"social_manners_acc":0.8202247191,"souvenirs_acc":0.72,"sports_acc":0.5079365079,"GPK_acc":0.7248255234,"SPK_acc":0.5948754703,"UPK_acc":0.5211086873}
         | 
| 20 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","acc":0.5635086255,"cinema_acc":0.45,"emergency_number_acc":0.2,"foods_acc":0.49,"games_acc":0.45,"herbal_drugs_acc":0.45,"places_acc":0.6285714286,"poetry_acc":0.35,"politicians_acc":0.3,"popular_people_acc":0.4974358974,"Government_law_acc":0.7608695652,"proverbs_acc":0.64,"religous_acc":0.6888888889,"social_manners_acc":0.8202247191,"souvenirs_acc":0.56,"sports_acc":0.3968253968,"GPK_acc":0.5513459621,"SPK_acc":0.5967741935,"UPK_acc":0.5412549724}
         | 
| 21 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"27400000000","source_type":"Open-Source","acc":0.5633303193,"cinema_acc":0.625,"emergency_number_acc":0.4,"foods_acc":0.68,"games_acc":0.35,"herbal_drugs_acc":0.6,"places_acc":0.7904761905,"poetry_acc":0.7,"politicians_acc":0.75,"popular_people_acc":0.641025641,"Government_law_acc":0.8913043478,"proverbs_acc":0.74,"religous_acc":0.7777777778,"social_manners_acc":0.8764044944,"souvenirs_acc":0.62,"sports_acc":0.6031746032,"GPK_acc":0.6989032901,"SPK_acc":0.5977423401,"UPK_acc":0.5212370076}
         | 
| 22 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.5440356745,"cinema_acc":0.5263157895,"emergency_number_acc":0.4,"foods_acc":0.72,"games_acc":0.55,"herbal_drugs_acc":0.575,"places_acc":0.8095238095,"poetry_acc":0.625,"politicians_acc":0.75,"popular_people_acc":0.6717948718,"Government_law_acc":0.8043478261,"proverbs_acc":0.72,"religous_acc":0.8444444444,"social_manners_acc":0.8539325843,"souvenirs_acc":0.6,"sports_acc":0.4920634921,"GPK_acc":0.6906906907,"SPK_acc":0.5934420355,"UPK_acc":0.4897066392}
         | 
    	
        leaderboard/boards_data/all.jsonl
    CHANGED
    
    | @@ -1,11 +1,14 @@ | |
| 1 | 
             
            {"Model Name":"o3","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.7468,"Persian IFEval":0.926035503,"Persian MT-Bench":0.91375,"PerMMLU":0.8217442751,"PerCoR":0.9218,"Persian NLU":0.7207167537,"Persian NLG":0.1764906292}
         | 
| 2 | 
             
            {"Model Name":"gemini-2.5-pro","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.7332,"Persian IFEval":0.8911764706,"Persian MT-Bench":0.91075,"PerMMLU":0.8401114206,"PerCoR":0.9427585507,"Persian NLU":0.6992555201,"Persian NLG":0.1151518212}
         | 
|  | |
| 3 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.7127,"Persian IFEval":0.8810572687,"Persian MT-Bench":0.8695,"PerMMLU":0.7214996174,"PerCoR":0.9117647059,"Persian NLU":0.7143086066,"Persian NLG":0.1779340777}
         | 
| 4 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.6992,"Persian IFEval":0.8634361233,"Persian MT-Bench":0.87325,"PerMMLU":0.7040411769,"PerCoR":0.8839,"Persian NLU":0.6758278127,"Persian NLG":0.194675133}
         | 
| 5 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.6986,"Persian IFEval":0.8796992481,"Persian MT-Bench":0.8812289562,"PerMMLU":0.7274624374,"PerCoR":0.8717,"Persian NLU":0.6944128198,"Persian NLG":0.1368740087}
         | 
| 6 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.6886,"Persian IFEval":0.8497790869,"Persian MT-Bench":0.838973064,"PerMMLU":0.6957640676,"PerCoR":0.8637863786,"Persian NLU":0.7050532433,"Persian NLG":0.178231145}
         | 
| 7 | 
             
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.6877,"Persian IFEval":0.8296622614,"Persian MT-Bench":0.8371666667,"PerMMLU":0.6884607359,"PerCoR":0.8665,"Persian NLU":0.7146808531,"Persian NLG":0.18964968}
         | 
| 8 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.664,"Persian IFEval":0.8414096916,"Persian MT-Bench":0.8244166667,"PerMMLU":0.6466578563,"PerCoR":0.8143,"Persian NLU":0.6914202844,"Persian NLG":0.1659339021}
         | 
|  | |
|  | |
| 9 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.6556,"Persian IFEval":0.8340675477,"Persian MT-Bench":0.8418333333,"PerMMLU":0.6128538638,"PerCoR":0.7712,"Persian NLU":0.6833497104,"Persian NLG":0.1901206806}
         | 
| 10 | 
             
            {"Model Name":"deepseek-reasoner","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","Average":0.6549,"Persian IFEval":0.8370044053,"Persian MT-Bench":0.86175,"PerMMLU":0.6810513107,"PerCoR":0.825165033,"Persian NLU":0.6361186163,"Persian NLG":0.0880621978}
         | 
| 11 | 
             
            {"Model Name":"deepseek-chat","thinking_method":"β","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","Average":0.6458,"Persian IFEval":0.8311306902,"Persian MT-Bench":0.8600833333,"PerMMLU":0.5908047576,"PerCoR":0.8241,"Persian NLU":0.6752949557,"Persian NLG":0.0934094344}
         | 
| @@ -14,9 +17,11 @@ | |
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","Average":0.6224,"Persian IFEval":0.803030303,"Persian MT-Bench":0.7632996633,"PerMMLU":0.5635086255,"PerCoR":0.7654,"Persian NLU":0.6714091535,"Persian NLG":0.1679338638}
         | 
| 15 | 
             
            {"Model Name":"Llama-3.3-70B-Instruct","thinking_method":"β","model_url":"https_google.com","parameters_count":"70600000000","source_type":"Open-Source","Average":0.613,"Persian IFEval":0.7125925926,"Persian MT-Bench":0.7172558923,"PerMMLU":0.5714086374,"PerCoR":0.7956,"Persian NLU":0.6800109206,"Persian NLG":0.2010896964}
         | 
| 16 | 
             
            {"Model Name":"c4ai-command-a-03-2025","thinking_method":"β","model_url":"https_google.com","parameters_count":"111000000000","source_type":"Open-Source","Average":0.6098,"Persian IFEval":0.8438880707,"Persian MT-Bench":0.8219166667,"PerMMLU":0.5980651448,"PerCoR":0.798859772,"Persian NLU":0.4824528512,"Persian NLG":0.1137933652}
         | 
|  | |
| 17 | 
             
            {"Model Name":"gemma-3-12b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"12200000000","source_type":"Open-Source","Average":0.6008,"Persian IFEval":0.8149779736,"Persian MT-Bench":0.75125,"PerMMLU":0.5105376643,"PerCoR":0.7094,"Persian NLU":0.699116864,"Persian NLG":0.1196804312}
         | 
| 18 | 
             
            {"Model Name":"Qwen3-30B-A3B","thinking_method":"β","model_url":"https_google.com","parameters_count":"30500000000","source_type":"Open-Source","Average":0.5939,"Persian IFEval":0.8325508607,"Persian MT-Bench":0.7431271478,"PerMMLU":0.5097725534,"PerCoR":0.688,"Persian NLU":0.6255818412,"Persian NLG":0.164118288}
         | 
| 19 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https_google.com","parameters_count":"14800000000","source_type":"Open-Source","Average":0.5912,"Persian IFEval":0.8105726872,"Persian MT-Bench":0.7204545455,"PerMMLU":0.5139458858,"PerCoR":0.6958,"Persian NLU":0.6460328733,"Persian NLG":0.16056333}
         | 
|  | |
| 20 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https_google.com","parameters_count":"104000000000","source_type":"Open-Source","Average":0.5705,"Persian IFEval":0.7007407407,"Persian MT-Bench":0.688,"PerMMLU":0.4800723378,"PerCoR":0.7364,"Persian NLU":0.6297634971,"Persian NLG":0.1880477876}
         | 
| 21 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https_google.com","parameters_count":"24000000000","source_type":"Open-Source","Average":0.5576,"Persian IFEval":0.7526555387,"Persian MT-Bench":0.7290833333,"PerMMLU":0.4763231198,"PerCoR":0.6894,"Persian NLU":0.5661558794,"Persian NLG":0.1319091735}
         | 
| 22 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.5546,"Persian IFEval":0.825256975,"Persian MT-Bench":0.7585,"PerMMLU":0.5440356745,"PerCoR":0.7160432086,"Persian NLU":0.3749414991,"Persian NLG":0.1089333827}
         | 
|  | |
| 1 | 
             
            {"Model Name":"o3","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.7468,"Persian IFEval":0.926035503,"Persian MT-Bench":0.91375,"PerMMLU":0.8217442751,"PerCoR":0.9218,"Persian NLU":0.7207167537,"Persian NLG":0.1764906292}
         | 
| 2 | 
             
            {"Model Name":"gemini-2.5-pro","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.7332,"Persian IFEval":0.8911764706,"Persian MT-Bench":0.91075,"PerMMLU":0.8401114206,"PerCoR":0.9427585507,"Persian NLU":0.6992555201,"Persian NLG":0.1151518212}
         | 
| 3 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.7169,"Persian IFEval":0.9104258443,"Persian MT-Bench":0.86775,"PerMMLU":0.7620504973,"PerCoR":0.8651,"Persian NLU":0.7144353486,"Persian NLG":0.181552926}
         | 
| 4 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.7127,"Persian IFEval":0.8810572687,"Persian MT-Bench":0.8695,"PerMMLU":0.7214996174,"PerCoR":0.9117647059,"Persian NLU":0.7143086066,"Persian NLG":0.1779340777}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.6992,"Persian IFEval":0.8634361233,"Persian MT-Bench":0.87325,"PerMMLU":0.7040411769,"PerCoR":0.8839,"Persian NLU":0.6758278127,"Persian NLG":0.194675133}
         | 
| 6 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.6986,"Persian IFEval":0.8796992481,"Persian MT-Bench":0.8812289562,"PerMMLU":0.7274624374,"PerCoR":0.8717,"Persian NLU":0.6944128198,"Persian NLG":0.1368740087}
         | 
| 7 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.6886,"Persian IFEval":0.8497790869,"Persian MT-Bench":0.838973064,"PerMMLU":0.6957640676,"PerCoR":0.8637863786,"Persian NLU":0.7050532433,"Persian NLG":0.178231145}
         | 
| 8 | 
             
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.6877,"Persian IFEval":0.8296622614,"Persian MT-Bench":0.8371666667,"PerMMLU":0.6884607359,"PerCoR":0.8665,"Persian NLU":0.7146808531,"Persian NLG":0.18964968}
         | 
| 9 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.664,"Persian IFEval":0.8414096916,"Persian MT-Bench":0.8244166667,"PerMMLU":0.6466578563,"PerCoR":0.8143,"Persian NLU":0.6914202844,"Persian NLG":0.1659339021}
         | 
| 10 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.6637,"Persian IFEval":0.8972099853,"Persian MT-Bench":0.82825,"PerMMLU":0.6864436252,"PerCoR":0.731,"Persian NLU":0.6749652797,"Persian NLG":0.1643361642}
         | 
| 11 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","Average":0.6573,"Persian IFEval":0.8702064897,"Persian MT-Bench":0.8315833333,"PerMMLU":0.6772622939,"PerCoR":0.7643,"Persian NLU":0.6552939868,"Persian NLG":0.1454089411}
         | 
| 12 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.6556,"Persian IFEval":0.8340675477,"Persian MT-Bench":0.8418333333,"PerMMLU":0.6128538638,"PerCoR":0.7712,"Persian NLU":0.6833497104,"Persian NLG":0.1901206806}
         | 
| 13 | 
             
            {"Model Name":"deepseek-reasoner","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","Average":0.6549,"Persian IFEval":0.8370044053,"Persian MT-Bench":0.86175,"PerMMLU":0.6810513107,"PerCoR":0.825165033,"Persian NLU":0.6361186163,"Persian NLG":0.0880621978}
         | 
| 14 | 
             
            {"Model Name":"deepseek-chat","thinking_method":"β","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","Average":0.6458,"Persian IFEval":0.8311306902,"Persian MT-Bench":0.8600833333,"PerMMLU":0.5908047576,"PerCoR":0.8241,"Persian NLU":0.6752949557,"Persian NLG":0.0934094344}
         | 
|  | |
| 17 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","Average":0.6224,"Persian IFEval":0.803030303,"Persian MT-Bench":0.7632996633,"PerMMLU":0.5635086255,"PerCoR":0.7654,"Persian NLU":0.6714091535,"Persian NLG":0.1679338638}
         | 
| 18 | 
             
            {"Model Name":"Llama-3.3-70B-Instruct","thinking_method":"β","model_url":"https_google.com","parameters_count":"70600000000","source_type":"Open-Source","Average":0.613,"Persian IFEval":0.7125925926,"Persian MT-Bench":0.7172558923,"PerMMLU":0.5714086374,"PerCoR":0.7956,"Persian NLU":0.6800109206,"Persian NLG":0.2010896964}
         | 
| 19 | 
             
            {"Model Name":"c4ai-command-a-03-2025","thinking_method":"β","model_url":"https_google.com","parameters_count":"111000000000","source_type":"Open-Source","Average":0.6098,"Persian IFEval":0.8438880707,"Persian MT-Bench":0.8219166667,"PerMMLU":0.5980651448,"PerCoR":0.798859772,"Persian NLU":0.4824528512,"Persian NLG":0.1137933652}
         | 
| 20 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","Average":0.6087,"Persian IFEval":0.8449039882,"Persian MT-Bench":0.7530833333,"PerMMLU":0.5958127565,"PerCoR":0.6962,"Persian NLU":0.628506628,"Persian NLG":0.1334687319}
         | 
| 21 | 
             
            {"Model Name":"gemma-3-12b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"12200000000","source_type":"Open-Source","Average":0.6008,"Persian IFEval":0.8149779736,"Persian MT-Bench":0.75125,"PerMMLU":0.5105376643,"PerCoR":0.7094,"Persian NLU":0.699116864,"Persian NLG":0.1196804312}
         | 
| 22 | 
             
            {"Model Name":"Qwen3-30B-A3B","thinking_method":"β","model_url":"https_google.com","parameters_count":"30500000000","source_type":"Open-Source","Average":0.5939,"Persian IFEval":0.8325508607,"Persian MT-Bench":0.7431271478,"PerMMLU":0.5097725534,"PerCoR":0.688,"Persian NLU":0.6255818412,"Persian NLG":0.164118288}
         | 
| 23 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https_google.com","parameters_count":"14800000000","source_type":"Open-Source","Average":0.5912,"Persian IFEval":0.8105726872,"Persian MT-Bench":0.7204545455,"PerMMLU":0.5139458858,"PerCoR":0.6958,"Persian NLU":0.6460328733,"Persian NLG":0.16056333}
         | 
| 24 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https_google.com","parameters_count":"109000000000","source_type":"Open-Source","Average":0.5737,"Persian IFEval":0.7897058824,"Persian MT-Bench":0.74175,"PerMMLU":0.5639563191,"PerCoR":0.7814,"Persian NLU":0.4086928082,"Persian NLG":0.1567965528}
         | 
| 25 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https_google.com","parameters_count":"104000000000","source_type":"Open-Source","Average":0.5705,"Persian IFEval":0.7007407407,"Persian MT-Bench":0.688,"PerMMLU":0.4800723378,"PerCoR":0.7364,"Persian NLU":0.6297634971,"Persian NLG":0.1880477876}
         | 
| 26 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https_google.com","parameters_count":"24000000000","source_type":"Open-Source","Average":0.5576,"Persian IFEval":0.7526555387,"Persian MT-Bench":0.7290833333,"PerMMLU":0.4763231198,"PerCoR":0.6894,"Persian NLU":0.5661558794,"Persian NLG":0.1319091735}
         | 
| 27 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","Average":0.5546,"Persian IFEval":0.825256975,"Persian MT-Bench":0.7585,"PerMMLU":0.5440356745,"PerCoR":0.7160432086,"Persian NLU":0.3749414991,"Persian NLG":0.1089333827}
         | 
    	
        leaderboard/boards_data/extractive-qa_PQuAD.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","extractive-qa_PQuAD_exact_match":21.8957345972,"extractive-qa_PQuAD_f1":0.5899280585,"nlu_score":0.7143086066}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":29.8578199052,"extractive-qa_PQuAD_f1":0.6483891649,"nlu_score":0.6241793507}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":51.6587677725,"extractive-qa_PQuAD_f1":0.7997294818,"nlu_score":0.6297634971}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":null,"extractive-qa_PQuAD_f1":null,"nlu_score":0.6552152029}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","extractive-qa_PQuAD_exact_match":16.2085308057,"extractive-qa_PQuAD_f1":0.5540542726,"nlu_score":0.6758278127}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","extractive-qa_PQuAD_exact_match":null,"extractive-qa_PQuAD_f1":null,"nlu_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":24.9289099526,"extractive-qa_PQuAD_f1":0.5952537387,"nlu_score":0.6898261633}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":11.9431279621,"extractive-qa_PQuAD_f1":0.5054306037,"nlu_score":0.6460328733}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":12.0379146919,"extractive-qa_PQuAD_f1":0.5152644082,"nlu_score":0.6714091535}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","extractive-qa_PQuAD_exact_match":1.5165876777,"extractive-qa_PQuAD_f1":0.3221621809,"nlu_score":0.3749414991}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":13.0805687204,"extractive-qa_PQuAD_f1":0.5111951184,"nlu_score":0.5661558794}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":null,"extractive-qa_PQuAD_f1":null,"nlu_score":0.456845738}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","extractive-qa_PQuAD_exact_match":21.8957345972,"extractive-qa_PQuAD_f1":0.5899280585,"nlu_score":0.7143086066}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":42.0853080569,"extractive-qa_PQuAD_f1":0.747356805,"nlu_score":0.628506628}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":29.8578199052,"extractive-qa_PQuAD_f1":0.6483891649,"nlu_score":0.6241793507}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":51.6587677725,"extractive-qa_PQuAD_f1":0.7997294818,"nlu_score":0.6297634971}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","extractive-qa_PQuAD_exact_match":42.9383886256,"extractive-qa_PQuAD_f1":0.7674489336,"nlu_score":0.7144353486}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","extractive-qa_PQuAD_exact_match":41.6113744076,"extractive-qa_PQuAD_f1":0.7625286761,"nlu_score":0.6749652797}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":37.345971564,"extractive-qa_PQuAD_f1":0.7251201928,"nlu_score":0.6552939868}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":null,"extractive-qa_PQuAD_f1":null,"nlu_score":0.6552152029}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","extractive-qa_PQuAD_exact_match":16.2085308057,"extractive-qa_PQuAD_f1":0.5540542726,"nlu_score":0.6758278127}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","extractive-qa_PQuAD_exact_match":null,"extractive-qa_PQuAD_f1":null,"nlu_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":24.9289099526,"extractive-qa_PQuAD_f1":0.5952537387,"nlu_score":0.6898261633}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":11.9431279621,"extractive-qa_PQuAD_f1":0.5054306037,"nlu_score":0.6460328733}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":12.0379146919,"extractive-qa_PQuAD_f1":0.5152644082,"nlu_score":0.6714091535}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":16.5876777251,"extractive-qa_PQuAD_f1":0.5291313789,"nlu_score":0.4086928082}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","extractive-qa_PQuAD_exact_match":1.5165876777,"extractive-qa_PQuAD_f1":0.3221621809,"nlu_score":0.3749414991}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":13.0805687204,"extractive-qa_PQuAD_f1":0.5111951184,"nlu_score":0.5661558794}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","extractive-qa_PQuAD_exact_match":null,"extractive-qa_PQuAD_f1":null,"nlu_score":0.456845738}
         | 
    	
        leaderboard/boards_data/ifeval.jsonl
    CHANGED
    
    | @@ -1,22 +1,27 @@ | |
| 1 | 
             
            {"Model Name":"o3","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.8967032967,"strict_instruction_accuracy":0.926035503,"loose_prompt_accuracy":0.9076923077,"loose_instruction_accuracy":0.9378698225,"strict_combination_category":0.859375,"strict_detectable_content_category":0.9565217391,"strict_detectable_format_category":0.8979591837,"strict_keywords_category":0.965034965,"strict_language_category":1.0,"strict_length_constraints_category":0.8852459016,"strict_punctuation_category":0.95,"strict_startend_category":0.9682539683,"loose_combination_category":0.875,"loose_detectable_content_category":0.9565217391,"loose_detectable_format_category":0.8979591837,"loose_keywords_category":0.979020979,"loose_language_category":1.0,"loose_length_constraints_category":0.9016393443,"loose_punctuation_category":1.0,"loose_startend_category":0.9682539683}
         | 
|  | |
|  | |
| 2 | 
             
            {"Model Name":"gemini-2.5-pro","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.8464912281,"strict_instruction_accuracy":0.8911764706,"loose_prompt_accuracy":0.8815789474,"loose_instruction_accuracy":0.9191176471,"strict_combination_category":0.8461538462,"strict_detectable_content_category":0.9777777778,"strict_detectable_format_category":0.8707482993,"strict_keywords_category":0.875862069,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.8211382114,"strict_punctuation_category":1.0,"strict_startend_category":0.9523809524,"loose_combination_category":0.8461538462,"loose_detectable_content_category":0.9777777778,"loose_detectable_format_category":0.8707482993,"loose_keywords_category":0.9172413793,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.9268292683,"loose_punctuation_category":1.0,"loose_startend_category":0.9523809524}
         | 
| 3 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.8336980306,"strict_instruction_accuracy":0.8810572687,"loose_prompt_accuracy":0.8774617068,"loose_instruction_accuracy":0.9148311307,"strict_combination_category":0.8307692308,"strict_detectable_content_category":0.9782608696,"strict_detectable_format_category":0.8775510204,"strict_keywords_category":0.8965517241,"strict_language_category":1.0,"strict_length_constraints_category":0.756097561,"strict_punctuation_category":0.9508196721,"strict_startend_category":0.9523809524,"loose_combination_category":0.8461538462,"loose_detectable_content_category":0.9782608696,"loose_detectable_format_category":0.8775510204,"loose_keywords_category":0.9448275862,"loose_language_category":1.0,"loose_length_constraints_category":0.8536585366,"loose_punctuation_category":0.9836065574,"loose_startend_category":0.9682539683}
         | 
| 4 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.836689038,"strict_instruction_accuracy":0.8796992481,"loose_prompt_accuracy":0.8680089485,"loose_instruction_accuracy":0.9067669173,"strict_combination_category":0.8,"strict_detectable_content_category":0.9772727273,"strict_detectable_format_category":0.8689655172,"strict_keywords_category":0.8623188406,"strict_language_category":0.935483871,"strict_length_constraints_category":0.8166666667,"strict_punctuation_category":0.9666666667,"strict_startend_category":0.9677419355,"loose_combination_category":0.8307692308,"loose_detectable_content_category":0.9772727273,"loose_detectable_format_category":0.875862069,"loose_keywords_category":0.9130434783,"loose_language_category":0.935483871,"loose_length_constraints_category":0.8666666667,"loose_punctuation_category":1.0,"loose_startend_category":0.9677419355}
         | 
|  | |
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.8140043764,"strict_instruction_accuracy":0.8634361233,"loose_prompt_accuracy":0.8512035011,"loose_instruction_accuracy":0.8942731278,"strict_combination_category":0.7846153846,"strict_detectable_content_category":0.9347826087,"strict_detectable_format_category":0.8911564626,"strict_keywords_category":0.8482758621,"strict_language_category":1.0,"strict_length_constraints_category":0.7804878049,"strict_punctuation_category":0.868852459,"strict_startend_category":0.9523809524,"loose_combination_category":0.8153846154,"loose_detectable_content_category":0.9347826087,"loose_detectable_format_category":0.9047619048,"loose_keywords_category":0.9103448276,"loose_language_category":1.0,"loose_length_constraints_category":0.837398374,"loose_punctuation_category":0.8852459016,"loose_startend_category":0.9523809524}
         | 
| 6 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.7916666667,"strict_instruction_accuracy":0.8497790869,"loose_prompt_accuracy":0.8245614035,"loose_instruction_accuracy":0.8777614138,"strict_combination_category":0.6875,"strict_detectable_content_category":0.9130434783,"strict_detectable_format_category":0.9047619048,"strict_keywords_category":0.7916666667,"strict_language_category":1.0,"strict_length_constraints_category":0.7642276423,"strict_punctuation_category":0.9672131148,"strict_startend_category":0.9523809524,"loose_combination_category":0.703125,"loose_detectable_content_category":0.9130434783,"loose_detectable_format_category":0.9047619048,"loose_keywords_category":0.8541666667,"loose_language_category":1.0,"loose_length_constraints_category":0.837398374,"loose_punctuation_category":0.9672131148,"loose_startend_category":0.9523809524}
         | 
|  | |
| 7 | 
             
            {"Model Name":"c4ai-command-a-03-2025","thinking_method":"β","model_url":"https_google.com","parameters_count":"111000000000","source_type":"Open-Source","strict_prompt_accuracy":0.7802197802,"strict_instruction_accuracy":0.8438880707,"loose_prompt_accuracy":0.832967033,"loose_instruction_accuracy":0.88365243,"strict_combination_category":0.8461538462,"strict_detectable_content_category":0.9347826087,"strict_detectable_format_category":0.8979591837,"strict_keywords_category":0.7793103448,"strict_language_category":1.0,"strict_length_constraints_category":0.7685950413,"strict_punctuation_category":0.8032786885,"strict_startend_category":0.9047619048,"loose_combination_category":0.8461538462,"loose_detectable_content_category":0.9347826087,"loose_detectable_format_category":0.9115646259,"loose_keywords_category":0.8482758621,"loose_language_category":1.0,"loose_length_constraints_category":0.8429752066,"loose_punctuation_category":0.868852459,"loose_startend_category":0.9365079365}
         | 
| 8 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.7921225383,"strict_instruction_accuracy":0.8414096916,"loose_prompt_accuracy":0.8161925602,"loose_instruction_accuracy":0.8649045521,"strict_combination_category":0.7230769231,"strict_detectable_content_category":0.9130434783,"strict_detectable_format_category":0.8367346939,"strict_keywords_category":0.8137931034,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.7642276423,"strict_punctuation_category":0.9672131148,"strict_startend_category":0.9523809524,"loose_combination_category":0.7384615385,"loose_detectable_content_category":0.9130434783,"loose_detectable_format_category":0.8367346939,"loose_keywords_category":0.875862069,"loose_language_category":1.0,"loose_length_constraints_category":0.8048780488,"loose_punctuation_category":0.9672131148,"loose_startend_category":0.9523809524}
         | 
| 9 | 
             
            {"Model Name":"deepseek-reasoner","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","strict_prompt_accuracy":0.7702407002,"strict_instruction_accuracy":0.8370044053,"loose_prompt_accuracy":0.8140043764,"loose_instruction_accuracy":0.8707782673,"strict_combination_category":0.7384615385,"strict_detectable_content_category":0.9782608696,"strict_detectable_format_category":0.8503401361,"strict_keywords_category":0.7862068966,"strict_language_category":1.0,"strict_length_constraints_category":0.756097561,"strict_punctuation_category":0.9836065574,"strict_startend_category":0.8571428571,"loose_combination_category":0.7538461538,"loose_detectable_content_category":0.9782608696,"loose_detectable_format_category":0.8571428571,"loose_keywords_category":0.8551724138,"loose_language_category":1.0,"loose_length_constraints_category":0.8048780488,"loose_punctuation_category":1.0,"loose_startend_category":0.9206349206}
         | 
| 10 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.772428884,"strict_instruction_accuracy":0.8340675477,"loose_prompt_accuracy":0.7986870897,"loose_instruction_accuracy":0.8575624082,"strict_combination_category":0.6923076923,"strict_detectable_content_category":0.847826087,"strict_detectable_format_category":0.8775510204,"strict_keywords_category":0.8344827586,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.7154471545,"strict_punctuation_category":0.9180327869,"strict_startend_category":0.9523809524,"loose_combination_category":0.7230769231,"loose_detectable_content_category":0.847826087,"loose_detectable_format_category":0.8843537415,"loose_keywords_category":0.8827586207,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.756097561,"loose_punctuation_category":0.9344262295,"loose_startend_category":0.9523809524}
         | 
| 11 | 
             
            {"Model Name":"Qwen3-30B-A3B","thinking_method":"β","model_url":"https_google.com","parameters_count":"30500000000","source_type":"Open-Source","strict_prompt_accuracy":0.7662037037,"strict_instruction_accuracy":0.8325508607,"loose_prompt_accuracy":0.8078703704,"loose_instruction_accuracy":0.8638497653,"strict_combination_category":0.6349206349,"strict_detectable_content_category":0.8837209302,"strict_detectable_format_category":0.9136690647,"strict_keywords_category":0.7954545455,"strict_language_category":0.9655172414,"strict_length_constraints_category":0.7192982456,"strict_punctuation_category":0.9655172414,"strict_startend_category":0.9180327869,"loose_combination_category":0.7936507937,"loose_detectable_content_category":0.8837209302,"loose_detectable_format_category":0.928057554,"loose_keywords_category":0.8257575758,"loose_language_category":0.9655172414,"loose_length_constraints_category":0.7543859649,"loose_punctuation_category":0.9655172414,"loose_startend_category":0.9180327869}
         | 
| 12 | 
             
            {"Model Name":"deepseek-chat","thinking_method":"β","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","strict_prompt_accuracy":0.7702407002,"strict_instruction_accuracy":0.8311306902,"loose_prompt_accuracy":0.8205689278,"loose_instruction_accuracy":0.8693098385,"strict_combination_category":0.7846153846,"strict_detectable_content_category":1.0,"strict_detectable_format_category":0.8503401361,"strict_keywords_category":0.8,"strict_language_category":1.0,"strict_length_constraints_category":0.6666666667,"strict_punctuation_category":0.9672131148,"strict_startend_category":0.8888888889,"loose_combination_category":0.8153846154,"loose_detectable_content_category":1.0,"loose_detectable_format_category":0.8639455782,"loose_keywords_category":0.8551724138,"loose_language_category":1.0,"loose_length_constraints_category":0.7479674797,"loose_punctuation_category":0.9836065574,"loose_startend_category":0.9365079365}
         | 
| 13 | 
            -
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.772428884,"strict_instruction_accuracy":0.8296622614,"loose_prompt_accuracy":0.8140043764,"loose_instruction_accuracy":0.8649045521,"strict_combination_category":0.8,"strict_detectable_content_category":0.9782608696,"strict_detectable_format_category":0.8911564626,"strict_keywords_category":0.7793103448,"strict_language_category":1.0,"strict_length_constraints_category":0.6829268293,"strict_punctuation_category":0.8360655738,"strict_startend_category":0.9206349206,"loose_combination_category":0.8153846154,"loose_detectable_content_category":0.9782608696,"loose_detectable_format_category":0.9115646259,"loose_keywords_category":0.8344827586,"loose_language_category":1.0,"loose_length_constraints_category":0.7479674797,"loose_punctuation_category":0.8852459016,"loose_startend_category":0.9365079365}
         | 
| 14 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"27400000000","source_type":"Open-Source","strict_prompt_accuracy":0.7636761488,"strict_instruction_accuracy":0.8296622614,"loose_prompt_accuracy":0.8052516411,"loose_instruction_accuracy":0.8634361233,"strict_combination_category":0.7230769231,"strict_detectable_content_category":0.8913043478,"strict_detectable_format_category":0.8095238095,"strict_keywords_category":0.7931034483,"strict_language_category":1.0,"strict_length_constraints_category":0.7886178862,"strict_punctuation_category":0.9836065574,"strict_startend_category":0.873015873,"loose_combination_category":0.7230769231,"loose_detectable_content_category":0.8913043478,"loose_detectable_format_category":0.8095238095,"loose_keywords_category":0.875862069,"loose_language_category":1.0,"loose_length_constraints_category":0.8780487805,"loose_punctuation_category":0.9836065574,"loose_startend_category":0.873015873}
         | 
|  | |
| 15 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.761487965,"strict_instruction_accuracy":0.825256975,"loose_prompt_accuracy":0.7877461707,"loose_instruction_accuracy":0.8516886931,"strict_combination_category":0.7384615385,"strict_detectable_content_category":0.9565217391,"strict_detectable_format_category":0.8571428571,"strict_keywords_category":0.8413793103,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.6097560976,"strict_punctuation_category":1.0,"strict_startend_category":0.8888888889,"loose_combination_category":0.7538461538,"loose_detectable_content_category":0.9565217391,"loose_detectable_format_category":0.8775510204,"loose_keywords_category":0.875862069,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.6666666667,"loose_punctuation_category":1.0,"loose_startend_category":0.9206349206}
         | 
| 16 | 
             
            {"Model Name":"gemma-3-12b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"12200000000","source_type":"Open-Source","strict_prompt_accuracy":0.7396061269,"strict_instruction_accuracy":0.8149779736,"loose_prompt_accuracy":0.7877461707,"loose_instruction_accuracy":0.8516886931,"strict_combination_category":0.6923076923,"strict_detectable_content_category":0.9130434783,"strict_detectable_format_category":0.8911564626,"strict_keywords_category":0.7586206897,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.7479674797,"strict_punctuation_category":0.8032786885,"strict_startend_category":0.8888888889,"loose_combination_category":0.6923076923,"loose_detectable_content_category":0.9130434783,"loose_detectable_format_category":0.8911564626,"loose_keywords_category":0.8344827586,"loose_language_category":1.0,"loose_length_constraints_category":0.8292682927,"loose_punctuation_category":0.8360655738,"loose_startend_category":0.9047619048}
         | 
| 17 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https_google.com","parameters_count":"14800000000","source_type":"Open-Source","strict_prompt_accuracy":0.7483588621,"strict_instruction_accuracy":0.8105726872,"loose_prompt_accuracy":0.7899343545,"loose_instruction_accuracy":0.845814978,"strict_combination_category":0.7230769231,"strict_detectable_content_category":0.8913043478,"strict_detectable_format_category":0.8979591837,"strict_keywords_category":0.7724137931,"strict_language_category":0.935483871,"strict_length_constraints_category":0.7479674797,"strict_punctuation_category":0.7049180328,"strict_startend_category":0.8888888889,"loose_combination_category":0.7692307692,"loose_detectable_content_category":0.8913043478,"loose_detectable_format_category":0.9115646259,"loose_keywords_category":0.8413793103,"loose_language_category":0.935483871,"loose_length_constraints_category":0.7642276423,"loose_punctuation_category":0.7540983607,"loose_startend_category":0.9523809524}
         | 
| 18 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","strict_prompt_accuracy":0.7342342342,"strict_instruction_accuracy":0.803030303,"loose_prompt_accuracy":0.786036036,"loose_instruction_accuracy":0.846969697,"strict_combination_category":0.625,"strict_detectable_content_category":0.9111111111,"strict_detectable_format_category":0.8951048951,"strict_keywords_category":0.7785714286,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.6140350877,"strict_punctuation_category":0.9333333333,"strict_startend_category":0.8888888889,"loose_combination_category":0.6875,"loose_detectable_content_category":0.9111111111,"loose_detectable_format_category":0.9090909091,"loose_keywords_category":0.85,"loose_language_category":1.0,"loose_length_constraints_category":0.6666666667,"loose_punctuation_category":0.95,"loose_startend_category":0.9682539683}
         | 
| 19 | 
             
            {"Model Name":"gpt-4o-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.7308533917,"strict_instruction_accuracy":0.8017621145,"loose_prompt_accuracy":0.772428884,"loose_instruction_accuracy":0.8355359765,"strict_combination_category":0.7384615385,"strict_detectable_content_category":0.8913043478,"strict_detectable_format_category":0.843537415,"strict_keywords_category":0.7379310345,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.6666666667,"strict_punctuation_category":0.9016393443,"strict_startend_category":0.9365079365,"loose_combination_category":0.7538461538,"loose_detectable_content_category":0.8913043478,"loose_detectable_format_category":0.8775510204,"loose_keywords_category":0.7793103448,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.7398373984,"loose_punctuation_category":0.9344262295,"loose_startend_category":0.9365079365}
         | 
|  | |
| 20 | 
             
            {"Model Name":"gpt-4.1-nano","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.6827133479,"strict_instruction_accuracy":0.7577092511,"loose_prompt_accuracy":0.7199124726,"loose_instruction_accuracy":0.7885462555,"strict_combination_category":0.5846153846,"strict_detectable_content_category":0.7608695652,"strict_detectable_format_category":0.8027210884,"strict_keywords_category":0.7793103448,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.6829268293,"strict_punctuation_category":0.7704918033,"strict_startend_category":0.8095238095,"loose_combination_category":0.6153846154,"loose_detectable_content_category":0.7608695652,"loose_detectable_format_category":0.8095238095,"loose_keywords_category":0.8344827586,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.7154471545,"loose_punctuation_category":0.8360655738,"loose_startend_category":0.8412698413}
         | 
| 21 | 
             
            {"Model Name":"Qwen3-4B","thinking_method":"β","model_url":"https_google.com","parameters_count":"4020000000","source_type":"Open-Source","strict_prompt_accuracy":0.6717724289,"strict_instruction_accuracy":0.7577092511,"loose_prompt_accuracy":0.7264770241,"loose_instruction_accuracy":0.798825257,"strict_combination_category":0.5384615385,"strict_detectable_content_category":0.8913043478,"strict_detectable_format_category":0.9047619048,"strict_keywords_category":0.7172413793,"strict_language_category":0.8387096774,"strict_length_constraints_category":0.6666666667,"strict_punctuation_category":0.8196721311,"strict_startend_category":0.7142857143,"loose_combination_category":0.5692307692,"loose_detectable_content_category":0.8913043478,"loose_detectable_format_category":0.9115646259,"loose_keywords_category":0.7931034483,"loose_language_category":0.8709677419,"loose_length_constraints_category":0.7235772358,"loose_punctuation_category":0.8852459016,"loose_startend_category":0.746031746}
         | 
| 22 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https_google.com","parameters_count":"24000000000","source_type":"Open-Source","strict_prompt_accuracy":0.6644144144,"strict_instruction_accuracy":0.7526555387,"loose_prompt_accuracy":0.7274774775,"loose_instruction_accuracy":0.7996965099,"strict_combination_category":0.6153846154,"strict_detectable_content_category":0.8444444444,"strict_detectable_format_category":0.8014184397,"strict_keywords_category":0.7642857143,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.641025641,"strict_punctuation_category":0.7333333333,"strict_startend_category":0.8166666667,"loose_combination_category":0.6615384615,"loose_detectable_content_category":0.8444444444,"loose_detectable_format_category":0.8156028369,"loose_keywords_category":0.8071428571,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.7606837607,"loose_punctuation_category":0.8,"loose_startend_category":0.85}
         | 
|  | |
| 1 | 
             
            {"Model Name":"o3","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.8967032967,"strict_instruction_accuracy":0.926035503,"loose_prompt_accuracy":0.9076923077,"loose_instruction_accuracy":0.9378698225,"strict_combination_category":0.859375,"strict_detectable_content_category":0.9565217391,"strict_detectable_format_category":0.8979591837,"strict_keywords_category":0.965034965,"strict_language_category":1.0,"strict_length_constraints_category":0.8852459016,"strict_punctuation_category":0.95,"strict_startend_category":0.9682539683,"loose_combination_category":0.875,"loose_detectable_content_category":0.9565217391,"loose_detectable_format_category":0.8979591837,"loose_keywords_category":0.979020979,"loose_language_category":1.0,"loose_length_constraints_category":0.9016393443,"loose_punctuation_category":1.0,"loose_startend_category":0.9682539683}
         | 
| 2 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.875273523,"strict_instruction_accuracy":0.9104258443,"loose_prompt_accuracy":0.8927789934,"loose_instruction_accuracy":0.9251101322,"strict_combination_category":0.7230769231,"strict_detectable_content_category":1.0,"strict_detectable_format_category":0.925170068,"strict_keywords_category":0.924137931,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.9024390244,"strict_punctuation_category":0.9508196721,"strict_startend_category":0.9206349206,"loose_combination_category":0.7384615385,"loose_detectable_content_category":1.0,"loose_detectable_format_category":0.925170068,"loose_keywords_category":0.9517241379,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.9105691057,"loose_punctuation_category":1.0,"loose_startend_category":0.9365079365}
         | 
| 3 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.8577680525,"strict_instruction_accuracy":0.8972099853,"loose_prompt_accuracy":0.8840262582,"loose_instruction_accuracy":0.9177679883,"strict_combination_category":0.7076923077,"strict_detectable_content_category":0.9565217391,"strict_detectable_format_category":0.8843537415,"strict_keywords_category":0.924137931,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.8943089431,"strict_punctuation_category":0.9508196721,"strict_startend_category":0.9365079365,"loose_combination_category":0.7230769231,"loose_detectable_content_category":0.9565217391,"loose_detectable_format_category":0.8843537415,"loose_keywords_category":0.9448275862,"loose_language_category":1.0,"loose_length_constraints_category":0.9430894309,"loose_punctuation_category":1.0,"loose_startend_category":0.9365079365}
         | 
| 4 | 
             
            {"Model Name":"gemini-2.5-pro","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.8464912281,"strict_instruction_accuracy":0.8911764706,"loose_prompt_accuracy":0.8815789474,"loose_instruction_accuracy":0.9191176471,"strict_combination_category":0.8461538462,"strict_detectable_content_category":0.9777777778,"strict_detectable_format_category":0.8707482993,"strict_keywords_category":0.875862069,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.8211382114,"strict_punctuation_category":1.0,"strict_startend_category":0.9523809524,"loose_combination_category":0.8461538462,"loose_detectable_content_category":0.9777777778,"loose_detectable_format_category":0.8707482993,"loose_keywords_category":0.9172413793,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.9268292683,"loose_punctuation_category":1.0,"loose_startend_category":0.9523809524}
         | 
| 5 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.8336980306,"strict_instruction_accuracy":0.8810572687,"loose_prompt_accuracy":0.8774617068,"loose_instruction_accuracy":0.9148311307,"strict_combination_category":0.8307692308,"strict_detectable_content_category":0.9782608696,"strict_detectable_format_category":0.8775510204,"strict_keywords_category":0.8965517241,"strict_language_category":1.0,"strict_length_constraints_category":0.756097561,"strict_punctuation_category":0.9508196721,"strict_startend_category":0.9523809524,"loose_combination_category":0.8461538462,"loose_detectable_content_category":0.9782608696,"loose_detectable_format_category":0.8775510204,"loose_keywords_category":0.9448275862,"loose_language_category":1.0,"loose_length_constraints_category":0.8536585366,"loose_punctuation_category":0.9836065574,"loose_startend_category":0.9682539683}
         | 
| 6 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.836689038,"strict_instruction_accuracy":0.8796992481,"loose_prompt_accuracy":0.8680089485,"loose_instruction_accuracy":0.9067669173,"strict_combination_category":0.8,"strict_detectable_content_category":0.9772727273,"strict_detectable_format_category":0.8689655172,"strict_keywords_category":0.8623188406,"strict_language_category":0.935483871,"strict_length_constraints_category":0.8166666667,"strict_punctuation_category":0.9666666667,"strict_startend_category":0.9677419355,"loose_combination_category":0.8307692308,"loose_detectable_content_category":0.9772727273,"loose_detectable_format_category":0.875862069,"loose_keywords_category":0.9130434783,"loose_language_category":0.935483871,"loose_length_constraints_category":0.8666666667,"loose_punctuation_category":1.0,"loose_startend_category":0.9677419355}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","strict_prompt_accuracy":0.8197802198,"strict_instruction_accuracy":0.8702064897,"loose_prompt_accuracy":0.8615384615,"loose_instruction_accuracy":0.9041297935,"strict_combination_category":0.8,"strict_detectable_content_category":0.9130434783,"strict_detectable_format_category":0.9452054795,"strict_keywords_category":0.8344827586,"strict_language_category":0.935483871,"strict_length_constraints_category":0.8016528926,"strict_punctuation_category":0.8360655738,"strict_startend_category":0.9523809524,"loose_combination_category":0.8153846154,"loose_detectable_content_category":0.9130434783,"loose_detectable_format_category":0.9520547945,"loose_keywords_category":0.8965517241,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.8595041322,"loose_punctuation_category":0.8852459016,"loose_startend_category":0.9682539683}
         | 
| 8 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.8140043764,"strict_instruction_accuracy":0.8634361233,"loose_prompt_accuracy":0.8512035011,"loose_instruction_accuracy":0.8942731278,"strict_combination_category":0.7846153846,"strict_detectable_content_category":0.9347826087,"strict_detectable_format_category":0.8911564626,"strict_keywords_category":0.8482758621,"strict_language_category":1.0,"strict_length_constraints_category":0.7804878049,"strict_punctuation_category":0.868852459,"strict_startend_category":0.9523809524,"loose_combination_category":0.8153846154,"loose_detectable_content_category":0.9347826087,"loose_detectable_format_category":0.9047619048,"loose_keywords_category":0.9103448276,"loose_language_category":1.0,"loose_length_constraints_category":0.837398374,"loose_punctuation_category":0.8852459016,"loose_startend_category":0.9523809524}
         | 
| 9 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.7916666667,"strict_instruction_accuracy":0.8497790869,"loose_prompt_accuracy":0.8245614035,"loose_instruction_accuracy":0.8777614138,"strict_combination_category":0.6875,"strict_detectable_content_category":0.9130434783,"strict_detectable_format_category":0.9047619048,"strict_keywords_category":0.7916666667,"strict_language_category":1.0,"strict_length_constraints_category":0.7642276423,"strict_punctuation_category":0.9672131148,"strict_startend_category":0.9523809524,"loose_combination_category":0.703125,"loose_detectable_content_category":0.9130434783,"loose_detectable_format_category":0.9047619048,"loose_keywords_category":0.8541666667,"loose_language_category":1.0,"loose_length_constraints_category":0.837398374,"loose_punctuation_category":0.9672131148,"loose_startend_category":0.9523809524}
         | 
| 10 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","strict_prompt_accuracy":0.7846153846,"strict_instruction_accuracy":0.8449039882,"loose_prompt_accuracy":0.8131868132,"loose_instruction_accuracy":0.8670605613,"strict_combination_category":0.7076923077,"strict_detectable_content_category":0.8913043478,"strict_detectable_format_category":0.8979591837,"strict_keywords_category":0.8671328671,"strict_language_category":1.0,"strict_length_constraints_category":0.7704918033,"strict_punctuation_category":0.8,"strict_startend_category":0.8888888889,"loose_combination_category":0.7076923077,"loose_detectable_content_category":0.8913043478,"loose_detectable_format_category":0.8979591837,"loose_keywords_category":0.9090909091,"loose_language_category":1.0,"loose_length_constraints_category":0.8196721311,"loose_punctuation_category":0.8333333333,"loose_startend_category":0.9047619048}
         | 
| 11 | 
             
            {"Model Name":"c4ai-command-a-03-2025","thinking_method":"β","model_url":"https_google.com","parameters_count":"111000000000","source_type":"Open-Source","strict_prompt_accuracy":0.7802197802,"strict_instruction_accuracy":0.8438880707,"loose_prompt_accuracy":0.832967033,"loose_instruction_accuracy":0.88365243,"strict_combination_category":0.8461538462,"strict_detectable_content_category":0.9347826087,"strict_detectable_format_category":0.8979591837,"strict_keywords_category":0.7793103448,"strict_language_category":1.0,"strict_length_constraints_category":0.7685950413,"strict_punctuation_category":0.8032786885,"strict_startend_category":0.9047619048,"loose_combination_category":0.8461538462,"loose_detectable_content_category":0.9347826087,"loose_detectable_format_category":0.9115646259,"loose_keywords_category":0.8482758621,"loose_language_category":1.0,"loose_length_constraints_category":0.8429752066,"loose_punctuation_category":0.868852459,"loose_startend_category":0.9365079365}
         | 
| 12 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.7921225383,"strict_instruction_accuracy":0.8414096916,"loose_prompt_accuracy":0.8161925602,"loose_instruction_accuracy":0.8649045521,"strict_combination_category":0.7230769231,"strict_detectable_content_category":0.9130434783,"strict_detectable_format_category":0.8367346939,"strict_keywords_category":0.8137931034,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.7642276423,"strict_punctuation_category":0.9672131148,"strict_startend_category":0.9523809524,"loose_combination_category":0.7384615385,"loose_detectable_content_category":0.9130434783,"loose_detectable_format_category":0.8367346939,"loose_keywords_category":0.875862069,"loose_language_category":1.0,"loose_length_constraints_category":0.8048780488,"loose_punctuation_category":0.9672131148,"loose_startend_category":0.9523809524}
         | 
| 13 | 
             
            {"Model Name":"deepseek-reasoner","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","strict_prompt_accuracy":0.7702407002,"strict_instruction_accuracy":0.8370044053,"loose_prompt_accuracy":0.8140043764,"loose_instruction_accuracy":0.8707782673,"strict_combination_category":0.7384615385,"strict_detectable_content_category":0.9782608696,"strict_detectable_format_category":0.8503401361,"strict_keywords_category":0.7862068966,"strict_language_category":1.0,"strict_length_constraints_category":0.756097561,"strict_punctuation_category":0.9836065574,"strict_startend_category":0.8571428571,"loose_combination_category":0.7538461538,"loose_detectable_content_category":0.9782608696,"loose_detectable_format_category":0.8571428571,"loose_keywords_category":0.8551724138,"loose_language_category":1.0,"loose_length_constraints_category":0.8048780488,"loose_punctuation_category":1.0,"loose_startend_category":0.9206349206}
         | 
| 14 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.772428884,"strict_instruction_accuracy":0.8340675477,"loose_prompt_accuracy":0.7986870897,"loose_instruction_accuracy":0.8575624082,"strict_combination_category":0.6923076923,"strict_detectable_content_category":0.847826087,"strict_detectable_format_category":0.8775510204,"strict_keywords_category":0.8344827586,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.7154471545,"strict_punctuation_category":0.9180327869,"strict_startend_category":0.9523809524,"loose_combination_category":0.7230769231,"loose_detectable_content_category":0.847826087,"loose_detectable_format_category":0.8843537415,"loose_keywords_category":0.8827586207,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.756097561,"loose_punctuation_category":0.9344262295,"loose_startend_category":0.9523809524}
         | 
| 15 | 
             
            {"Model Name":"Qwen3-30B-A3B","thinking_method":"β","model_url":"https_google.com","parameters_count":"30500000000","source_type":"Open-Source","strict_prompt_accuracy":0.7662037037,"strict_instruction_accuracy":0.8325508607,"loose_prompt_accuracy":0.8078703704,"loose_instruction_accuracy":0.8638497653,"strict_combination_category":0.6349206349,"strict_detectable_content_category":0.8837209302,"strict_detectable_format_category":0.9136690647,"strict_keywords_category":0.7954545455,"strict_language_category":0.9655172414,"strict_length_constraints_category":0.7192982456,"strict_punctuation_category":0.9655172414,"strict_startend_category":0.9180327869,"loose_combination_category":0.7936507937,"loose_detectable_content_category":0.8837209302,"loose_detectable_format_category":0.928057554,"loose_keywords_category":0.8257575758,"loose_language_category":0.9655172414,"loose_length_constraints_category":0.7543859649,"loose_punctuation_category":0.9655172414,"loose_startend_category":0.9180327869}
         | 
| 16 | 
             
            {"Model Name":"deepseek-chat","thinking_method":"β","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","strict_prompt_accuracy":0.7702407002,"strict_instruction_accuracy":0.8311306902,"loose_prompt_accuracy":0.8205689278,"loose_instruction_accuracy":0.8693098385,"strict_combination_category":0.7846153846,"strict_detectable_content_category":1.0,"strict_detectable_format_category":0.8503401361,"strict_keywords_category":0.8,"strict_language_category":1.0,"strict_length_constraints_category":0.6666666667,"strict_punctuation_category":0.9672131148,"strict_startend_category":0.8888888889,"loose_combination_category":0.8153846154,"loose_detectable_content_category":1.0,"loose_detectable_format_category":0.8639455782,"loose_keywords_category":0.8551724138,"loose_language_category":1.0,"loose_length_constraints_category":0.7479674797,"loose_punctuation_category":0.9836065574,"loose_startend_category":0.9365079365}
         | 
|  | |
| 17 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"27400000000","source_type":"Open-Source","strict_prompt_accuracy":0.7636761488,"strict_instruction_accuracy":0.8296622614,"loose_prompt_accuracy":0.8052516411,"loose_instruction_accuracy":0.8634361233,"strict_combination_category":0.7230769231,"strict_detectable_content_category":0.8913043478,"strict_detectable_format_category":0.8095238095,"strict_keywords_category":0.7931034483,"strict_language_category":1.0,"strict_length_constraints_category":0.7886178862,"strict_punctuation_category":0.9836065574,"strict_startend_category":0.873015873,"loose_combination_category":0.7230769231,"loose_detectable_content_category":0.8913043478,"loose_detectable_format_category":0.8095238095,"loose_keywords_category":0.875862069,"loose_language_category":1.0,"loose_length_constraints_category":0.8780487805,"loose_punctuation_category":0.9836065574,"loose_startend_category":0.873015873}
         | 
| 18 | 
            +
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.772428884,"strict_instruction_accuracy":0.8296622614,"loose_prompt_accuracy":0.8140043764,"loose_instruction_accuracy":0.8649045521,"strict_combination_category":0.8,"strict_detectable_content_category":0.9782608696,"strict_detectable_format_category":0.8911564626,"strict_keywords_category":0.7793103448,"strict_language_category":1.0,"strict_length_constraints_category":0.6829268293,"strict_punctuation_category":0.8360655738,"strict_startend_category":0.9206349206,"loose_combination_category":0.8153846154,"loose_detectable_content_category":0.9782608696,"loose_detectable_format_category":0.9115646259,"loose_keywords_category":0.8344827586,"loose_language_category":1.0,"loose_length_constraints_category":0.7479674797,"loose_punctuation_category":0.8852459016,"loose_startend_category":0.9365079365}
         | 
| 19 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.761487965,"strict_instruction_accuracy":0.825256975,"loose_prompt_accuracy":0.7877461707,"loose_instruction_accuracy":0.8516886931,"strict_combination_category":0.7384615385,"strict_detectable_content_category":0.9565217391,"strict_detectable_format_category":0.8571428571,"strict_keywords_category":0.8413793103,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.6097560976,"strict_punctuation_category":1.0,"strict_startend_category":0.8888888889,"loose_combination_category":0.7538461538,"loose_detectable_content_category":0.9565217391,"loose_detectable_format_category":0.8775510204,"loose_keywords_category":0.875862069,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.6666666667,"loose_punctuation_category":1.0,"loose_startend_category":0.9206349206}
         | 
| 20 | 
             
            {"Model Name":"gemma-3-12b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"12200000000","source_type":"Open-Source","strict_prompt_accuracy":0.7396061269,"strict_instruction_accuracy":0.8149779736,"loose_prompt_accuracy":0.7877461707,"loose_instruction_accuracy":0.8516886931,"strict_combination_category":0.6923076923,"strict_detectable_content_category":0.9130434783,"strict_detectable_format_category":0.8911564626,"strict_keywords_category":0.7586206897,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.7479674797,"strict_punctuation_category":0.8032786885,"strict_startend_category":0.8888888889,"loose_combination_category":0.6923076923,"loose_detectable_content_category":0.9130434783,"loose_detectable_format_category":0.8911564626,"loose_keywords_category":0.8344827586,"loose_language_category":1.0,"loose_length_constraints_category":0.8292682927,"loose_punctuation_category":0.8360655738,"loose_startend_category":0.9047619048}
         | 
| 21 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https_google.com","parameters_count":"14800000000","source_type":"Open-Source","strict_prompt_accuracy":0.7483588621,"strict_instruction_accuracy":0.8105726872,"loose_prompt_accuracy":0.7899343545,"loose_instruction_accuracy":0.845814978,"strict_combination_category":0.7230769231,"strict_detectable_content_category":0.8913043478,"strict_detectable_format_category":0.8979591837,"strict_keywords_category":0.7724137931,"strict_language_category":0.935483871,"strict_length_constraints_category":0.7479674797,"strict_punctuation_category":0.7049180328,"strict_startend_category":0.8888888889,"loose_combination_category":0.7692307692,"loose_detectable_content_category":0.8913043478,"loose_detectable_format_category":0.9115646259,"loose_keywords_category":0.8413793103,"loose_language_category":0.935483871,"loose_length_constraints_category":0.7642276423,"loose_punctuation_category":0.7540983607,"loose_startend_category":0.9523809524}
         | 
| 22 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","strict_prompt_accuracy":0.7342342342,"strict_instruction_accuracy":0.803030303,"loose_prompt_accuracy":0.786036036,"loose_instruction_accuracy":0.846969697,"strict_combination_category":0.625,"strict_detectable_content_category":0.9111111111,"strict_detectable_format_category":0.8951048951,"strict_keywords_category":0.7785714286,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.6140350877,"strict_punctuation_category":0.9333333333,"strict_startend_category":0.8888888889,"loose_combination_category":0.6875,"loose_detectable_content_category":0.9111111111,"loose_detectable_format_category":0.9090909091,"loose_keywords_category":0.85,"loose_language_category":1.0,"loose_length_constraints_category":0.6666666667,"loose_punctuation_category":0.95,"loose_startend_category":0.9682539683}
         | 
| 23 | 
             
            {"Model Name":"gpt-4o-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.7308533917,"strict_instruction_accuracy":0.8017621145,"loose_prompt_accuracy":0.772428884,"loose_instruction_accuracy":0.8355359765,"strict_combination_category":0.7384615385,"strict_detectable_content_category":0.8913043478,"strict_detectable_format_category":0.843537415,"strict_keywords_category":0.7379310345,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.6666666667,"strict_punctuation_category":0.9016393443,"strict_startend_category":0.9365079365,"loose_combination_category":0.7538461538,"loose_detectable_content_category":0.8913043478,"loose_detectable_format_category":0.8775510204,"loose_keywords_category":0.7793103448,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.7398373984,"loose_punctuation_category":0.9344262295,"loose_startend_category":0.9365079365}
         | 
| 24 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https_google.com","parameters_count":"109000000000","source_type":"Open-Source","strict_prompt_accuracy":0.7083333333,"strict_instruction_accuracy":0.7897058824,"loose_prompt_accuracy":0.7280701754,"loose_instruction_accuracy":0.8058823529,"strict_combination_category":0.5076923077,"strict_detectable_content_category":0.847826087,"strict_detectable_format_category":0.8775510204,"strict_keywords_category":0.7916666667,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.674796748,"strict_punctuation_category":0.868852459,"strict_startend_category":0.8888888889,"loose_combination_category":0.5230769231,"loose_detectable_content_category":0.847826087,"loose_detectable_format_category":0.8843537415,"loose_keywords_category":0.8263888889,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.7073170732,"loose_punctuation_category":0.868852459,"loose_startend_category":0.8888888889}
         | 
| 25 | 
             
            {"Model Name":"gpt-4.1-nano","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","strict_prompt_accuracy":0.6827133479,"strict_instruction_accuracy":0.7577092511,"loose_prompt_accuracy":0.7199124726,"loose_instruction_accuracy":0.7885462555,"strict_combination_category":0.5846153846,"strict_detectable_content_category":0.7608695652,"strict_detectable_format_category":0.8027210884,"strict_keywords_category":0.7793103448,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.6829268293,"strict_punctuation_category":0.7704918033,"strict_startend_category":0.8095238095,"loose_combination_category":0.6153846154,"loose_detectable_content_category":0.7608695652,"loose_detectable_format_category":0.8095238095,"loose_keywords_category":0.8344827586,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.7154471545,"loose_punctuation_category":0.8360655738,"loose_startend_category":0.8412698413}
         | 
| 26 | 
             
            {"Model Name":"Qwen3-4B","thinking_method":"β","model_url":"https_google.com","parameters_count":"4020000000","source_type":"Open-Source","strict_prompt_accuracy":0.6717724289,"strict_instruction_accuracy":0.7577092511,"loose_prompt_accuracy":0.7264770241,"loose_instruction_accuracy":0.798825257,"strict_combination_category":0.5384615385,"strict_detectable_content_category":0.8913043478,"strict_detectable_format_category":0.9047619048,"strict_keywords_category":0.7172413793,"strict_language_category":0.8387096774,"strict_length_constraints_category":0.6666666667,"strict_punctuation_category":0.8196721311,"strict_startend_category":0.7142857143,"loose_combination_category":0.5692307692,"loose_detectable_content_category":0.8913043478,"loose_detectable_format_category":0.9115646259,"loose_keywords_category":0.7931034483,"loose_language_category":0.8709677419,"loose_length_constraints_category":0.7235772358,"loose_punctuation_category":0.8852459016,"loose_startend_category":0.746031746}
         | 
| 27 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https_google.com","parameters_count":"24000000000","source_type":"Open-Source","strict_prompt_accuracy":0.6644144144,"strict_instruction_accuracy":0.7526555387,"loose_prompt_accuracy":0.7274774775,"loose_instruction_accuracy":0.7996965099,"strict_combination_category":0.6153846154,"strict_detectable_content_category":0.8444444444,"strict_detectable_format_category":0.8014184397,"strict_keywords_category":0.7642857143,"strict_language_category":0.9677419355,"strict_length_constraints_category":0.641025641,"strict_punctuation_category":0.7333333333,"strict_startend_category":0.8166666667,"loose_combination_category":0.6615384615,"loose_detectable_content_category":0.8444444444,"loose_detectable_format_category":0.8156028369,"loose_keywords_category":0.8071428571,"loose_language_category":0.9677419355,"loose_length_constraints_category":0.7606837607,"loose_punctuation_category":0.8,"loose_startend_category":0.85}
         | 
    	
        leaderboard/boards_data/keyword-extraction_SynKeywords.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","keyword-extraction_SynKeywords_f1_mean":0.2115068728,"keyword-extraction_SynKeywords_precision_mean":0.1912410205,"keyword-extraction_SynKeywords_recall_mean":0.2483695652,"nlu_score":0.7143086066}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.229921048,"keyword-extraction_SynKeywords_precision_mean":0.21147343,"keyword-extraction_SynKeywords_recall_mean":0.2634963768,"nlu_score":0.6241793507}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.0860842686,"keyword-extraction_SynKeywords_precision_mean":0.0757882818,"keyword-extraction_SynKeywords_recall_mean":0.1065217391,"nlu_score":0.6297634971}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.2645652392,"keyword-extraction_SynKeywords_precision_mean":0.2349391249,"keyword-extraction_SynKeywords_recall_mean":0.3166666667,"nlu_score":0.6552152029}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","keyword-extraction_SynKeywords_f1_mean":0.1217550899,"keyword-extraction_SynKeywords_precision_mean":0.1020894964,"keyword-extraction_SynKeywords_recall_mean":0.1608695652,"nlu_score":0.6758278127}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","keyword-extraction_SynKeywords_f1_mean":null,"keyword-extraction_SynKeywords_precision_mean":null,"keyword-extraction_SynKeywords_recall_mean":null,"nlu_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.2384077673,"keyword-extraction_SynKeywords_precision_mean":0.2041836259,"keyword-extraction_SynKeywords_recall_mean":0.3015398551,"nlu_score":0.6898261633}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.233766167,"keyword-extraction_SynKeywords_precision_mean":0.1893302534,"keyword-extraction_SynKeywords_recall_mean":0.3297101449,"nlu_score":0.6460328733}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.1369232983,"keyword-extraction_SynKeywords_precision_mean":0.1117212542,"keyword-extraction_SynKeywords_recall_mean":0.1863224638,"nlu_score":0.6714091535}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","keyword-extraction_SynKeywords_f1_mean":0.2568096145,"keyword-extraction_SynKeywords_precision_mean":0.2483731877,"keyword-extraction_SynKeywords_recall_mean":0.2765873016,"nlu_score":0.3749414991}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.1942845429,"keyword-extraction_SynKeywords_precision_mean":0.168197784,"keyword-extraction_SynKeywords_recall_mean":0.2451992754,"nlu_score":0.5661558794}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.1409784417,"keyword-extraction_SynKeywords_precision_mean":0.1216706248,"keyword-extraction_SynKeywords_recall_mean":0.1832427536,"nlu_score":0.456845738}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","keyword-extraction_SynKeywords_f1_mean":0.2115068728,"keyword-extraction_SynKeywords_precision_mean":0.1912410205,"keyword-extraction_SynKeywords_recall_mean":0.2483695652,"nlu_score":0.7143086066}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.1297217026,"keyword-extraction_SynKeywords_precision_mean":0.1052290945,"keyword-extraction_SynKeywords_recall_mean":0.1816123188,"nlu_score":0.628506628}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.229921048,"keyword-extraction_SynKeywords_precision_mean":0.21147343,"keyword-extraction_SynKeywords_recall_mean":0.2634963768,"nlu_score":0.6241793507}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.0860842686,"keyword-extraction_SynKeywords_precision_mean":0.0757882818,"keyword-extraction_SynKeywords_recall_mean":0.1065217391,"nlu_score":0.6297634971}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","keyword-extraction_SynKeywords_f1_mean":0.1547160783,"keyword-extraction_SynKeywords_precision_mean":0.1275089966,"keyword-extraction_SynKeywords_recall_mean":0.2111413043,"nlu_score":0.7144353486}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","keyword-extraction_SynKeywords_f1_mean":0.1186662307,"keyword-extraction_SynKeywords_precision_mean":0.1013265485,"keyword-extraction_SynKeywords_recall_mean":0.1581521739,"nlu_score":0.6749652797}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.1443868036,"keyword-extraction_SynKeywords_precision_mean":0.1209283696,"keyword-extraction_SynKeywords_recall_mean":0.191576087,"nlu_score":0.6552939868}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.2645652392,"keyword-extraction_SynKeywords_precision_mean":0.2349391249,"keyword-extraction_SynKeywords_recall_mean":0.3166666667,"nlu_score":0.6552152029}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","keyword-extraction_SynKeywords_f1_mean":0.1217550899,"keyword-extraction_SynKeywords_precision_mean":0.1020894964,"keyword-extraction_SynKeywords_recall_mean":0.1608695652,"nlu_score":0.6758278127}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","keyword-extraction_SynKeywords_f1_mean":null,"keyword-extraction_SynKeywords_precision_mean":null,"keyword-extraction_SynKeywords_recall_mean":null,"nlu_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.2384077673,"keyword-extraction_SynKeywords_precision_mean":0.2041836259,"keyword-extraction_SynKeywords_recall_mean":0.3015398551,"nlu_score":0.6898261633}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.233766167,"keyword-extraction_SynKeywords_precision_mean":0.1893302534,"keyword-extraction_SynKeywords_recall_mean":0.3297101449,"nlu_score":0.6460328733}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.1369232983,"keyword-extraction_SynKeywords_precision_mean":0.1117212542,"keyword-extraction_SynKeywords_recall_mean":0.1863224638,"nlu_score":0.6714091535}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.0169533238,"keyword-extraction_SynKeywords_precision_mean":0.015422274,"keyword-extraction_SynKeywords_recall_mean":0.0206521739,"nlu_score":0.4086928082}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","keyword-extraction_SynKeywords_f1_mean":0.2568096145,"keyword-extraction_SynKeywords_precision_mean":0.2483731877,"keyword-extraction_SynKeywords_recall_mean":0.2765873016,"nlu_score":0.3749414991}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.1942845429,"keyword-extraction_SynKeywords_precision_mean":0.168197784,"keyword-extraction_SynKeywords_recall_mean":0.2451992754,"nlu_score":0.5661558794}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","keyword-extraction_SynKeywords_f1_mean":0.1409784417,"keyword-extraction_SynKeywords_precision_mean":0.1216706248,"keyword-extraction_SynKeywords_recall_mean":0.1832427536,"nlu_score":0.456845738}
         | 
    	
        leaderboard/boards_data/mt_bench.jsonl
    CHANGED
    
    | @@ -3,19 +3,24 @@ | |
| 3 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.7983539095,"score_mean":8.8122895623,"writing_score_w_mean":8.52,"writing_score_mean":8.5462962963,"roleplay_score_w_mean":8.2857142857,"roleplay_score_mean":8.2583333333,"reasoning_score_w_mean":8.4666666667,"reasoning_score_mean":8.3666666667,"math_score_w_mean":9.652173913,"math_score_mean":9.6,"coding_score_w_mean":8.8,"coding_score_mean":8.8,"extraction_score_w_mean":8.75,"extraction_score_mean":8.75,"stem_score_w_mean":8.7,"stem_score_mean":8.7,"humanities_score_w_mean":9.0,"humanities_score_mean":9.0,"persian_general_knowledge_score_w_mean":8.8148148148,"persian_general_knowledge_score_mean":8.9166666667,"chatbot_rag_score_w_mean":9.1333333333,"chatbot_rag_score_mean":9.1583333333}
         | 
| 4 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.7428571429,"score_mean":8.7325,"writing_score_w_mean":8.4074074074,"writing_score_mean":8.3833333333,"roleplay_score_w_mean":8.6071428571,"roleplay_score_mean":8.625,"reasoning_score_w_mean":9.0666666667,"reasoning_score_mean":8.9666666667,"math_score_w_mean":9.7826086957,"math_score_mean":9.75,"coding_score_w_mean":8.15,"coding_score_mean":8.15,"extraction_score_w_mean":8.45,"extraction_score_mean":8.45,"stem_score_w_mean":8.7,"stem_score_mean":8.7,"humanities_score_w_mean":9.1,"humanities_score_mean":9.1,"persian_general_knowledge_score_w_mean":7.7777777778,"persian_general_knowledge_score_mean":7.9333333333,"chatbot_rag_score_w_mean":9.3,"chatbot_rag_score_mean":9.2666666667}
         | 
| 5 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.7510204082,"score_mean":8.695,"writing_score_w_mean":8.5925925926,"writing_score_mean":8.625,"roleplay_score_w_mean":8.2142857143,"roleplay_score_mean":8.2166666667,"reasoning_score_w_mean":9.0666666667,"reasoning_score_mean":8.7833333333,"math_score_w_mean":9.7826086957,"math_score_mean":9.75,"coding_score_w_mean":7.85,"coding_score_mean":7.85,"extraction_score_w_mean":8.6,"extraction_score_mean":8.6,"stem_score_w_mean":8.55,"stem_score_mean":8.55,"humanities_score_w_mean":9.2,"humanities_score_mean":9.2,"persian_general_knowledge_score_w_mean":8.1481481481,"persian_general_knowledge_score_mean":8.0,"chatbot_rag_score_w_mean":9.3666666667,"chatbot_rag_score_mean":9.375}
         | 
|  | |
| 6 | 
             
            {"Model Name":"deepseek-reasoner","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","score_w_mean":8.5795918367,"score_mean":8.6175,"writing_score_w_mean":8.6296296296,"writing_score_mean":8.65,"roleplay_score_w_mean":8.1785714286,"roleplay_score_mean":8.225,"reasoning_score_w_mean":8.9,"reasoning_score_mean":8.7416666667,"math_score_w_mean":9.3043478261,"math_score_mean":9.2,"coding_score_w_mean":8.75,"coding_score_mean":8.75,"extraction_score_w_mean":8.5,"extraction_score_mean":8.5,"stem_score_w_mean":8.55,"stem_score_mean":8.55,"humanities_score_w_mean":9.15,"humanities_score_mean":9.15,"persian_general_knowledge_score_w_mean":6.8148148148,"persian_general_knowledge_score_mean":7.2416666667,"chatbot_rag_score_w_mean":9.2,"chatbot_rag_score_mean":9.1666666667}
         | 
| 7 | 
             
            {"Model Name":"deepseek-chat","thinking_method":"β","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","score_w_mean":8.5102040816,"score_mean":8.6008333333,"writing_score_w_mean":8.4444444444,"writing_score_mean":8.4916666667,"roleplay_score_w_mean":8.9285714286,"roleplay_score_mean":8.9666666667,"reasoning_score_w_mean":8.3666666667,"reasoning_score_mean":8.3083333333,"math_score_w_mean":9.1304347826,"math_score_mean":9.0,"coding_score_w_mean":9.35,"coding_score_mean":9.35,"extraction_score_w_mean":8.65,"extraction_score_mean":8.65,"stem_score_w_mean":9.05,"stem_score_mean":9.05,"humanities_score_w_mean":9.25,"humanities_score_mean":9.25,"persian_general_knowledge_score_w_mean":5.0740740741,"persian_general_knowledge_score_mean":5.4916666667,"chatbot_rag_score_w_mean":9.4333333333,"chatbot_rag_score_mean":9.45}
         | 
| 8 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.3183673469,"score_mean":8.4183333333,"writing_score_w_mean":8.1111111111,"writing_score_mean":8.125,"roleplay_score_w_mean":8.0714285714,"roleplay_score_mean":8.0333333333,"reasoning_score_w_mean":8.1333333333,"reasoning_score_mean":8.0833333333,"math_score_w_mean":9.4347826087,"math_score_mean":9.35,"coding_score_w_mean":8.85,"coding_score_mean":8.85,"extraction_score_w_mean":8.6,"extraction_score_mean":8.6,"stem_score_w_mean":8.9,"stem_score_mean":8.9,"humanities_score_w_mean":9.0,"humanities_score_mean":9.0,"persian_general_knowledge_score_w_mean":5.2222222222,"persian_general_knowledge_score_mean":5.8083333333,"chatbot_rag_score_w_mean":9.4666666667,"chatbot_rag_score_mean":9.4333333333}
         | 
| 9 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.4522821577,"score_mean":8.3897306397,"writing_score_w_mean":8.4444444444,"writing_score_mean":8.475,"roleplay_score_w_mean":8.6785714286,"roleplay_score_mean":8.65,"reasoning_score_w_mean":8.4,"reasoning_score_mean":8.3333333333,"math_score_w_mean":9.0434782609,"math_score_mean":8.9,"coding_score_w_mean":7.05,"coding_score_mean":7.05,"extraction_score_w_mean":7.6,"extraction_score_mean":7.6,"stem_score_w_mean":8.4,"stem_score_mean":8.4,"humanities_score_w_mean":9.0,"humanities_score_mean":9.0,"persian_general_knowledge_score_w_mean":8.4074074074,"persian_general_knowledge_score_mean":8.4166666667,"chatbot_rag_score_w_mean":9.1538461538,"chatbot_rag_score_mean":9.1481481481}
         | 
| 10 | 
             
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.3551020408,"score_mean":8.3716666667,"writing_score_w_mean":8.1481481481,"writing_score_mean":8.175,"roleplay_score_w_mean":7.5,"roleplay_score_mean":7.45,"reasoning_score_w_mean":8.4666666667,"reasoning_score_mean":8.4833333333,"math_score_w_mean":8.7391304348,"math_score_mean":8.8416666667,"coding_score_w_mean":7.85,"coding_score_mean":7.85,"extraction_score_w_mean":8.25,"extraction_score_mean":8.25,"stem_score_w_mean":8.6,"stem_score_mean":8.6,"humanities_score_w_mean":9.05,"humanities_score_mean":9.05,"persian_general_knowledge_score_w_mean":7.8888888889,"persian_general_knowledge_score_mean":7.9,"chatbot_rag_score_w_mean":9.1333333333,"chatbot_rag_score_mean":9.1166666667}
         | 
|  | |
|  | |
| 11 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.212244898,"score_mean":8.2441666667,"writing_score_w_mean":8.4074074074,"writing_score_mean":8.3166666667,"roleplay_score_w_mean":7.7857142857,"roleplay_score_mean":7.7583333333,"reasoning_score_w_mean":6.7666666667,"reasoning_score_mean":6.8,"math_score_w_mean":9.2608695652,"math_score_mean":9.3,"coding_score_w_mean":8.4,"coding_score_mean":8.4,"extraction_score_w_mean":8.1,"extraction_score_mean":8.1,"stem_score_w_mean":8.35,"stem_score_mean":8.35,"humanities_score_w_mean":8.8,"humanities_score_mean":8.8,"persian_general_knowledge_score_w_mean":7.5925925926,"persian_general_knowledge_score_mean":7.5083333333,"chatbot_rag_score_w_mean":9.1,"chatbot_rag_score_mean":9.1083333333}
         | 
| 12 | 
             
            {"Model Name":"c4ai-command-a-03-2025","thinking_method":"β","model_url":"https_google.com","parameters_count":"111000000000","source_type":"Open-Source","score_w_mean":8.1795918367,"score_mean":8.2191666667,"writing_score_w_mean":8.1851851852,"writing_score_mean":8.25,"roleplay_score_w_mean":8.2857142857,"roleplay_score_mean":8.3333333333,"reasoning_score_w_mean":7.5333333333,"reasoning_score_mean":7.5416666667,"math_score_w_mean":9.0869565217,"math_score_mean":8.95,"coding_score_w_mean":8.3,"coding_score_mean":8.3,"extraction_score_w_mean":7.7,"extraction_score_mean":7.7,"stem_score_w_mean":8.4,"stem_score_mean":8.4,"humanities_score_w_mean":8.9,"humanities_score_mean":8.9,"persian_general_knowledge_score_w_mean":6.2962962963,"persian_general_knowledge_score_mean":6.4916666667,"chatbot_rag_score_w_mean":9.3333333333,"chatbot_rag_score_mean":9.325}
         | 
| 13 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"27400000000","source_type":"Open-Source","score_w_mean":7.8653061224,"score_mean":7.96,"writing_score_w_mean":8.3333333333,"writing_score_mean":8.3083333333,"roleplay_score_w_mean":7.6785714286,"roleplay_score_mean":7.5916666667,"reasoning_score_w_mean":7.0666666667,"reasoning_score_mean":7.2083333333,"math_score_w_mean":8.7826086957,"math_score_mean":8.65,"coding_score_w_mean":7.5,"coding_score_mean":7.5,"extraction_score_w_mean":8.4,"extraction_score_mean":8.4,"stem_score_w_mean":8.65,"stem_score_mean":8.65,"humanities_score_w_mean":8.85,"humanities_score_mean":8.85,"persian_general_knowledge_score_w_mean":4.8518518519,"persian_general_knowledge_score_mean":5.3083333333,"chatbot_rag_score_w_mean":9.1333333333,"chatbot_rag_score_mean":9.1333333333}
         | 
| 14 | 
             
            {"Model Name":"gpt-4o-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":7.8081632653,"score_mean":7.8916666667,"writing_score_w_mean":7.962962963,"writing_score_mean":7.9666666667,"roleplay_score_w_mean":7.6071428571,"roleplay_score_mean":7.5083333333,"reasoning_score_w_mean":6.7666666667,"reasoning_score_mean":6.7166666667,"math_score_w_mean":8.2608695652,"math_score_mean":8.225,"coding_score_w_mean":7.85,"coding_score_mean":7.85,"extraction_score_w_mean":8.3,"extraction_score_mean":8.3,"stem_score_w_mean":8.5,"stem_score_mean":8.5,"humanities_score_w_mean":8.8,"humanities_score_mean":8.8,"persian_general_knowledge_score_w_mean":5.3703703704,"persian_general_knowledge_score_mean":5.7666666667,"chatbot_rag_score_w_mean":9.2666666667,"chatbot_rag_score_mean":9.2833333333}
         | 
| 15 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","score_w_mean":7.5371900826,"score_mean":7.632996633,"writing_score_w_mean":7.4074074074,"writing_score_mean":7.4083333333,"roleplay_score_w_mean":7.4642857143,"roleplay_score_mean":7.2833333333,"reasoning_score_w_mean":7.5185185185,"reasoning_score_mean":7.6296296296,"math_score_w_mean":9.0,"math_score_mean":8.85,"coding_score_w_mean":8.1,"coding_score_mean":8.1,"extraction_score_w_mean":7.75,"extraction_score_mean":7.75,"stem_score_w_mean":9.0,"stem_score_mean":9.0,"humanities_score_w_mean":9.05,"humanities_score_mean":9.05,"persian_general_knowledge_score_w_mean":1.8148148148,"persian_general_knowledge_score_mean":2.0083333333,"chatbot_rag_score_w_mean":9.2666666667,"chatbot_rag_score_mean":9.25}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":7.4857142857,"score_mean":7.585,"writing_score_w_mean":8.1111111111,"writing_score_mean":8.0416666667,"roleplay_score_w_mean":7.0357142857,"roleplay_score_mean":7.1833333333,"reasoning_score_w_mean":5.8,"reasoning_score_mean":5.65,"math_score_w_mean":8.4782608696,"math_score_mean":8.25,"coding_score_w_mean":8.05,"coding_score_mean":8.05,"extraction_score_w_mean":7.9,"extraction_score_mean":7.9,"stem_score_w_mean":7.7,"stem_score_mean":7.7,"humanities_score_w_mean":8.5,"humanities_score_mean":8.5,"persian_general_knowledge_score_w_mean":4.8518518519,"persian_general_knowledge_score_mean":5.375,"chatbot_rag_score_w_mean":9.1666666667,"chatbot_rag_score_mean":9.2}
         | 
|  | |
| 17 | 
             
            {"Model Name":"gemma-3-12b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"12200000000","source_type":"Open-Source","score_w_mean":7.3918367347,"score_mean":7.5125,"writing_score_w_mean":7.8888888889,"writing_score_mean":7.95,"roleplay_score_w_mean":7.7142857143,"roleplay_score_mean":7.6416666667,"reasoning_score_w_mean":5.4333333333,"reasoning_score_mean":5.3166666667,"math_score_w_mean":8.7391304348,"math_score_mean":8.7,"coding_score_w_mean":7.55,"coding_score_mean":7.55,"extraction_score_w_mean":7.7,"extraction_score_mean":7.7,"stem_score_w_mean":8.6,"stem_score_mean":8.6,"humanities_score_w_mean":8.9,"humanities_score_mean":8.9,"persian_general_knowledge_score_w_mean":3.1851851852,"persian_general_knowledge_score_mean":3.5166666667,"chatbot_rag_score_w_mean":9.2333333333,"chatbot_rag_score_mean":9.25}
         | 
| 18 | 
             
            {"Model Name":"Qwen3-30B-A3B","thinking_method":"β","model_url":"https_google.com","parameters_count":"30500000000","source_type":"Open-Source","score_w_mean":7.3613445378,"score_mean":7.4312714777,"writing_score_w_mean":7.0,"writing_score_mean":6.9083333333,"roleplay_score_w_mean":7.2307692308,"roleplay_score_mean":7.0185185185,"reasoning_score_w_mean":6.8518518519,"reasoning_score_mean":6.8981481481,"math_score_w_mean":9.5652173913,"math_score_mean":9.5,"coding_score_w_mean":8.6,"coding_score_mean":8.6,"extraction_score_w_mean":6.75,"extraction_score_mean":6.75,"stem_score_w_mean":8.2,"stem_score_mean":8.2,"humanities_score_w_mean":8.3,"humanities_score_mean":8.3,"persian_general_knowledge_score_w_mean":2.16,"persian_general_knowledge_score_mean":2.1851851852,"chatbot_rag_score_w_mean":9.3,"chatbot_rag_score_mean":9.3333333333}
         | 
|  | |
| 19 | 
             
            {"Model Name":"gpt-4.1-nano","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":7.2367346939,"score_mean":7.3633333333,"writing_score_w_mean":7.7407407407,"writing_score_mean":7.6666666667,"roleplay_score_w_mean":7.6428571429,"roleplay_score_mean":7.5416666667,"reasoning_score_w_mean":5.7,"reasoning_score_mean":6.0416666667,"math_score_w_mean":8.1304347826,"math_score_mean":8.25,"coding_score_w_mean":8.05,"coding_score_mean":8.05,"extraction_score_w_mean":5.95,"extraction_score_mean":5.95,"stem_score_w_mean":7.85,"stem_score_mean":7.85,"humanities_score_w_mean":8.7,"humanities_score_mean":8.7,"persian_general_knowledge_score_w_mean":3.9259259259,"persian_general_knowledge_score_mean":4.3833333333,"chatbot_rag_score_w_mean":9.1666666667,"chatbot_rag_score_mean":9.2}
         | 
| 20 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https_google.com","parameters_count":"24000000000","source_type":"Open-Source","score_w_mean":7.2448979592,"score_mean":7.2908333333,"writing_score_w_mean":7.2592592593,"writing_score_mean":7.2333333333,"roleplay_score_w_mean":6.8214285714,"roleplay_score_mean":6.6666666667,"reasoning_score_w_mean":6.3333333333,"reasoning_score_mean":6.2,"math_score_w_mean":8.5217391304,"math_score_mean":8.3,"coding_score_w_mean":7.6,"coding_score_mean":7.6,"extraction_score_w_mean":7.95,"extraction_score_mean":7.95,"stem_score_w_mean":7.3,"stem_score_mean":7.3,"humanities_score_w_mean":8.7,"humanities_score_mean":8.7,"persian_general_knowledge_score_w_mean":3.1481481481,"persian_general_knowledge_score_mean":3.4583333333,"chatbot_rag_score_w_mean":9.5333333333,"chatbot_rag_score_mean":9.5}
         | 
| 21 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https_google.com","parameters_count":"14800000000","source_type":"Open-Source","score_w_mean":7.1769547325,"score_mean":7.2045454545,"writing_score_w_mean":7.2222222222,"writing_score_mean":7.2,"roleplay_score_w_mean":7.3214285714,"roleplay_score_mean":7.2583333333,"reasoning_score_w_mean":7.3666666667,"reasoning_score_mean":7.2833333333,"math_score_w_mean":8.3913043478,"math_score_mean":8.325,"coding_score_w_mean":6.7,"coding_score_mean":6.7,"extraction_score_w_mean":7.05,"extraction_score_mean":7.05,"stem_score_w_mean":8.5,"stem_score_mean":8.5,"humanities_score_w_mean":8.7222222222,"humanities_score_mean":8.7222222222,"persian_general_knowledge_score_w_mean":1.6666666667,"persian_general_knowledge_score_mean":1.7333333333,"chatbot_rag_score_w_mean":9.4333333333,"chatbot_rag_score_mean":9.425}
         | 
|  | |
| 3 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.7983539095,"score_mean":8.8122895623,"writing_score_w_mean":8.52,"writing_score_mean":8.5462962963,"roleplay_score_w_mean":8.2857142857,"roleplay_score_mean":8.2583333333,"reasoning_score_w_mean":8.4666666667,"reasoning_score_mean":8.3666666667,"math_score_w_mean":9.652173913,"math_score_mean":9.6,"coding_score_w_mean":8.8,"coding_score_mean":8.8,"extraction_score_w_mean":8.75,"extraction_score_mean":8.75,"stem_score_w_mean":8.7,"stem_score_mean":8.7,"humanities_score_w_mean":9.0,"humanities_score_mean":9.0,"persian_general_knowledge_score_w_mean":8.8148148148,"persian_general_knowledge_score_mean":8.9166666667,"chatbot_rag_score_w_mean":9.1333333333,"chatbot_rag_score_mean":9.1583333333}
         | 
| 4 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.7428571429,"score_mean":8.7325,"writing_score_w_mean":8.4074074074,"writing_score_mean":8.3833333333,"roleplay_score_w_mean":8.6071428571,"roleplay_score_mean":8.625,"reasoning_score_w_mean":9.0666666667,"reasoning_score_mean":8.9666666667,"math_score_w_mean":9.7826086957,"math_score_mean":9.75,"coding_score_w_mean":8.15,"coding_score_mean":8.15,"extraction_score_w_mean":8.45,"extraction_score_mean":8.45,"stem_score_w_mean":8.7,"stem_score_mean":8.7,"humanities_score_w_mean":9.1,"humanities_score_mean":9.1,"persian_general_knowledge_score_w_mean":7.7777777778,"persian_general_knowledge_score_mean":7.9333333333,"chatbot_rag_score_w_mean":9.3,"chatbot_rag_score_mean":9.2666666667}
         | 
| 5 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.7510204082,"score_mean":8.695,"writing_score_w_mean":8.5925925926,"writing_score_mean":8.625,"roleplay_score_w_mean":8.2142857143,"roleplay_score_mean":8.2166666667,"reasoning_score_w_mean":9.0666666667,"reasoning_score_mean":8.7833333333,"math_score_w_mean":9.7826086957,"math_score_mean":9.75,"coding_score_w_mean":7.85,"coding_score_mean":7.85,"extraction_score_w_mean":8.6,"extraction_score_mean":8.6,"stem_score_w_mean":8.55,"stem_score_mean":8.55,"humanities_score_w_mean":9.2,"humanities_score_mean":9.2,"persian_general_knowledge_score_w_mean":8.1481481481,"persian_general_knowledge_score_mean":8.0,"chatbot_rag_score_w_mean":9.3666666667,"chatbot_rag_score_mean":9.375}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.5632653061,"score_mean":8.6775,"writing_score_w_mean":7.7037037037,"writing_score_mean":7.675,"roleplay_score_w_mean":8.3928571429,"roleplay_score_mean":8.4166666667,"reasoning_score_w_mean":9.0333333333,"reasoning_score_mean":9.1166666667,"math_score_w_mean":9.652173913,"math_score_mean":9.6,"coding_score_w_mean":9.2,"coding_score_mean":9.2,"extraction_score_w_mean":9.15,"extraction_score_mean":9.15,"stem_score_w_mean":9.0,"stem_score_mean":9.0,"humanities_score_w_mean":9.2,"humanities_score_mean":9.2,"persian_general_knowledge_score_w_mean":5.5925925926,"persian_general_knowledge_score_mean":6.05,"chatbot_rag_score_w_mean":9.3333333333,"chatbot_rag_score_mean":9.3666666667}
         | 
| 7 | 
             
            {"Model Name":"deepseek-reasoner","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","score_w_mean":8.5795918367,"score_mean":8.6175,"writing_score_w_mean":8.6296296296,"writing_score_mean":8.65,"roleplay_score_w_mean":8.1785714286,"roleplay_score_mean":8.225,"reasoning_score_w_mean":8.9,"reasoning_score_mean":8.7416666667,"math_score_w_mean":9.3043478261,"math_score_mean":9.2,"coding_score_w_mean":8.75,"coding_score_mean":8.75,"extraction_score_w_mean":8.5,"extraction_score_mean":8.5,"stem_score_w_mean":8.55,"stem_score_mean":8.55,"humanities_score_w_mean":9.15,"humanities_score_mean":9.15,"persian_general_knowledge_score_w_mean":6.8148148148,"persian_general_knowledge_score_mean":7.2416666667,"chatbot_rag_score_w_mean":9.2,"chatbot_rag_score_mean":9.1666666667}
         | 
| 8 | 
             
            {"Model Name":"deepseek-chat","thinking_method":"β","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","score_w_mean":8.5102040816,"score_mean":8.6008333333,"writing_score_w_mean":8.4444444444,"writing_score_mean":8.4916666667,"roleplay_score_w_mean":8.9285714286,"roleplay_score_mean":8.9666666667,"reasoning_score_w_mean":8.3666666667,"reasoning_score_mean":8.3083333333,"math_score_w_mean":9.1304347826,"math_score_mean":9.0,"coding_score_w_mean":9.35,"coding_score_mean":9.35,"extraction_score_w_mean":8.65,"extraction_score_mean":8.65,"stem_score_w_mean":9.05,"stem_score_mean":9.05,"humanities_score_w_mean":9.25,"humanities_score_mean":9.25,"persian_general_knowledge_score_w_mean":5.0740740741,"persian_general_knowledge_score_mean":5.4916666667,"chatbot_rag_score_w_mean":9.4333333333,"chatbot_rag_score_mean":9.45}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.3183673469,"score_mean":8.4183333333,"writing_score_w_mean":8.1111111111,"writing_score_mean":8.125,"roleplay_score_w_mean":8.0714285714,"roleplay_score_mean":8.0333333333,"reasoning_score_w_mean":8.1333333333,"reasoning_score_mean":8.0833333333,"math_score_w_mean":9.4347826087,"math_score_mean":9.35,"coding_score_w_mean":8.85,"coding_score_mean":8.85,"extraction_score_w_mean":8.6,"extraction_score_mean":8.6,"stem_score_w_mean":8.9,"stem_score_mean":8.9,"humanities_score_w_mean":9.0,"humanities_score_mean":9.0,"persian_general_knowledge_score_w_mean":5.2222222222,"persian_general_knowledge_score_mean":5.8083333333,"chatbot_rag_score_w_mean":9.4666666667,"chatbot_rag_score_mean":9.4333333333}
         | 
| 10 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.4522821577,"score_mean":8.3897306397,"writing_score_w_mean":8.4444444444,"writing_score_mean":8.475,"roleplay_score_w_mean":8.6785714286,"roleplay_score_mean":8.65,"reasoning_score_w_mean":8.4,"reasoning_score_mean":8.3333333333,"math_score_w_mean":9.0434782609,"math_score_mean":8.9,"coding_score_w_mean":7.05,"coding_score_mean":7.05,"extraction_score_w_mean":7.6,"extraction_score_mean":7.6,"stem_score_w_mean":8.4,"stem_score_mean":8.4,"humanities_score_w_mean":9.0,"humanities_score_mean":9.0,"persian_general_knowledge_score_w_mean":8.4074074074,"persian_general_knowledge_score_mean":8.4166666667,"chatbot_rag_score_w_mean":9.1538461538,"chatbot_rag_score_mean":9.1481481481}
         | 
| 11 | 
             
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.3551020408,"score_mean":8.3716666667,"writing_score_w_mean":8.1481481481,"writing_score_mean":8.175,"roleplay_score_w_mean":7.5,"roleplay_score_mean":7.45,"reasoning_score_w_mean":8.4666666667,"reasoning_score_mean":8.4833333333,"math_score_w_mean":8.7391304348,"math_score_mean":8.8416666667,"coding_score_w_mean":7.85,"coding_score_mean":7.85,"extraction_score_w_mean":8.25,"extraction_score_mean":8.25,"stem_score_w_mean":8.6,"stem_score_mean":8.6,"humanities_score_w_mean":9.05,"humanities_score_mean":9.05,"persian_general_knowledge_score_w_mean":7.8888888889,"persian_general_knowledge_score_mean":7.9,"chatbot_rag_score_w_mean":9.1333333333,"chatbot_rag_score_mean":9.1166666667}
         | 
| 12 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","score_w_mean":8.2857142857,"score_mean":8.3158333333,"writing_score_w_mean":8.2222222222,"writing_score_mean":8.1083333333,"roleplay_score_w_mean":7.8928571429,"roleplay_score_mean":7.725,"reasoning_score_w_mean":8.9333333333,"reasoning_score_mean":8.6666666667,"math_score_w_mean":9.6956521739,"math_score_mean":9.65,"coding_score_w_mean":9.4,"coding_score_mean":9.4,"extraction_score_w_mean":8.5,"extraction_score_mean":8.5,"stem_score_w_mean":8.8,"stem_score_mean":8.8,"humanities_score_w_mean":8.85,"humanities_score_mean":8.85,"persian_general_knowledge_score_w_mean":3.5925925926,"persian_general_knowledge_score_mean":3.9416666667,"chatbot_rag_score_w_mean":9.6,"chatbot_rag_score_mean":9.5166666667}
         | 
| 13 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.2244897959,"score_mean":8.2825,"writing_score_w_mean":8.1481481481,"writing_score_mean":8.1166666667,"roleplay_score_w_mean":7.75,"roleplay_score_mean":7.625,"reasoning_score_w_mean":8.4333333333,"reasoning_score_mean":8.2666666667,"math_score_w_mean":9.652173913,"math_score_mean":9.6,"coding_score_w_mean":9.1,"coding_score_mean":9.1,"extraction_score_w_mean":7.65,"extraction_score_mean":7.65,"stem_score_w_mean":8.6,"stem_score_mean":8.6,"humanities_score_w_mean":8.85,"humanities_score_mean":8.85,"persian_general_knowledge_score_w_mean":5.3703703704,"persian_general_knowledge_score_mean":5.8833333333,"chatbot_rag_score_w_mean":9.1333333333,"chatbot_rag_score_mean":9.1333333333}
         | 
| 14 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":8.212244898,"score_mean":8.2441666667,"writing_score_w_mean":8.4074074074,"writing_score_mean":8.3166666667,"roleplay_score_w_mean":7.7857142857,"roleplay_score_mean":7.7583333333,"reasoning_score_w_mean":6.7666666667,"reasoning_score_mean":6.8,"math_score_w_mean":9.2608695652,"math_score_mean":9.3,"coding_score_w_mean":8.4,"coding_score_mean":8.4,"extraction_score_w_mean":8.1,"extraction_score_mean":8.1,"stem_score_w_mean":8.35,"stem_score_mean":8.35,"humanities_score_w_mean":8.8,"humanities_score_mean":8.8,"persian_general_knowledge_score_w_mean":7.5925925926,"persian_general_knowledge_score_mean":7.5083333333,"chatbot_rag_score_w_mean":9.1,"chatbot_rag_score_mean":9.1083333333}
         | 
| 15 | 
             
            {"Model Name":"c4ai-command-a-03-2025","thinking_method":"β","model_url":"https_google.com","parameters_count":"111000000000","source_type":"Open-Source","score_w_mean":8.1795918367,"score_mean":8.2191666667,"writing_score_w_mean":8.1851851852,"writing_score_mean":8.25,"roleplay_score_w_mean":8.2857142857,"roleplay_score_mean":8.3333333333,"reasoning_score_w_mean":7.5333333333,"reasoning_score_mean":7.5416666667,"math_score_w_mean":9.0869565217,"math_score_mean":8.95,"coding_score_w_mean":8.3,"coding_score_mean":8.3,"extraction_score_w_mean":7.7,"extraction_score_mean":7.7,"stem_score_w_mean":8.4,"stem_score_mean":8.4,"humanities_score_w_mean":8.9,"humanities_score_mean":8.9,"persian_general_knowledge_score_w_mean":6.2962962963,"persian_general_knowledge_score_mean":6.4916666667,"chatbot_rag_score_w_mean":9.3333333333,"chatbot_rag_score_mean":9.325}
         | 
| 16 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"27400000000","source_type":"Open-Source","score_w_mean":7.8653061224,"score_mean":7.96,"writing_score_w_mean":8.3333333333,"writing_score_mean":8.3083333333,"roleplay_score_w_mean":7.6785714286,"roleplay_score_mean":7.5916666667,"reasoning_score_w_mean":7.0666666667,"reasoning_score_mean":7.2083333333,"math_score_w_mean":8.7826086957,"math_score_mean":8.65,"coding_score_w_mean":7.5,"coding_score_mean":7.5,"extraction_score_w_mean":8.4,"extraction_score_mean":8.4,"stem_score_w_mean":8.65,"stem_score_mean":8.65,"humanities_score_w_mean":8.85,"humanities_score_mean":8.85,"persian_general_knowledge_score_w_mean":4.8518518519,"persian_general_knowledge_score_mean":5.3083333333,"chatbot_rag_score_w_mean":9.1333333333,"chatbot_rag_score_mean":9.1333333333}
         | 
| 17 | 
             
            {"Model Name":"gpt-4o-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":7.8081632653,"score_mean":7.8916666667,"writing_score_w_mean":7.962962963,"writing_score_mean":7.9666666667,"roleplay_score_w_mean":7.6071428571,"roleplay_score_mean":7.5083333333,"reasoning_score_w_mean":6.7666666667,"reasoning_score_mean":6.7166666667,"math_score_w_mean":8.2608695652,"math_score_mean":8.225,"coding_score_w_mean":7.85,"coding_score_mean":7.85,"extraction_score_w_mean":8.3,"extraction_score_mean":8.3,"stem_score_w_mean":8.5,"stem_score_mean":8.5,"humanities_score_w_mean":8.8,"humanities_score_mean":8.8,"persian_general_knowledge_score_w_mean":5.3703703704,"persian_general_knowledge_score_mean":5.7666666667,"chatbot_rag_score_w_mean":9.2666666667,"chatbot_rag_score_mean":9.2833333333}
         | 
| 18 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","score_w_mean":7.5371900826,"score_mean":7.632996633,"writing_score_w_mean":7.4074074074,"writing_score_mean":7.4083333333,"roleplay_score_w_mean":7.4642857143,"roleplay_score_mean":7.2833333333,"reasoning_score_w_mean":7.5185185185,"reasoning_score_mean":7.6296296296,"math_score_w_mean":9.0,"math_score_mean":8.85,"coding_score_w_mean":8.1,"coding_score_mean":8.1,"extraction_score_w_mean":7.75,"extraction_score_mean":7.75,"stem_score_w_mean":9.0,"stem_score_mean":9.0,"humanities_score_w_mean":9.05,"humanities_score_mean":9.05,"persian_general_knowledge_score_w_mean":1.8148148148,"persian_general_knowledge_score_mean":2.0083333333,"chatbot_rag_score_w_mean":9.2666666667,"chatbot_rag_score_mean":9.25}
         | 
| 19 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":7.4857142857,"score_mean":7.585,"writing_score_w_mean":8.1111111111,"writing_score_mean":8.0416666667,"roleplay_score_w_mean":7.0357142857,"roleplay_score_mean":7.1833333333,"reasoning_score_w_mean":5.8,"reasoning_score_mean":5.65,"math_score_w_mean":8.4782608696,"math_score_mean":8.25,"coding_score_w_mean":8.05,"coding_score_mean":8.05,"extraction_score_w_mean":7.9,"extraction_score_mean":7.9,"stem_score_w_mean":7.7,"stem_score_mean":7.7,"humanities_score_w_mean":8.5,"humanities_score_mean":8.5,"persian_general_knowledge_score_w_mean":4.8518518519,"persian_general_knowledge_score_mean":5.375,"chatbot_rag_score_w_mean":9.1666666667,"chatbot_rag_score_mean":9.2}
         | 
| 20 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","score_w_mean":7.4326530612,"score_mean":7.5308333333,"writing_score_w_mean":7.8148148148,"writing_score_mean":7.7166666667,"roleplay_score_w_mean":5.6071428571,"roleplay_score_mean":5.2666666667,"reasoning_score_w_mean":7.4333333333,"reasoning_score_mean":7.4416666667,"math_score_w_mean":10.0,"math_score_mean":10.0,"coding_score_w_mean":8.55,"coding_score_mean":8.55,"extraction_score_w_mean":8.15,"extraction_score_mean":8.15,"stem_score_w_mean":8.3,"stem_score_mean":8.3,"humanities_score_w_mean":8.85,"humanities_score_mean":8.85,"persian_general_knowledge_score_w_mean":1.6296296296,"persian_general_knowledge_score_mean":1.75,"chatbot_rag_score_w_mean":9.3,"chatbot_rag_score_mean":9.2833333333}
         | 
| 21 | 
             
            {"Model Name":"gemma-3-12b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"12200000000","source_type":"Open-Source","score_w_mean":7.3918367347,"score_mean":7.5125,"writing_score_w_mean":7.8888888889,"writing_score_mean":7.95,"roleplay_score_w_mean":7.7142857143,"roleplay_score_mean":7.6416666667,"reasoning_score_w_mean":5.4333333333,"reasoning_score_mean":5.3166666667,"math_score_w_mean":8.7391304348,"math_score_mean":8.7,"coding_score_w_mean":7.55,"coding_score_mean":7.55,"extraction_score_w_mean":7.7,"extraction_score_mean":7.7,"stem_score_w_mean":8.6,"stem_score_mean":8.6,"humanities_score_w_mean":8.9,"humanities_score_mean":8.9,"persian_general_knowledge_score_w_mean":3.1851851852,"persian_general_knowledge_score_mean":3.5166666667,"chatbot_rag_score_w_mean":9.2333333333,"chatbot_rag_score_mean":9.25}
         | 
| 22 | 
             
            {"Model Name":"Qwen3-30B-A3B","thinking_method":"β","model_url":"https_google.com","parameters_count":"30500000000","source_type":"Open-Source","score_w_mean":7.3613445378,"score_mean":7.4312714777,"writing_score_w_mean":7.0,"writing_score_mean":6.9083333333,"roleplay_score_w_mean":7.2307692308,"roleplay_score_mean":7.0185185185,"reasoning_score_w_mean":6.8518518519,"reasoning_score_mean":6.8981481481,"math_score_w_mean":9.5652173913,"math_score_mean":9.5,"coding_score_w_mean":8.6,"coding_score_mean":8.6,"extraction_score_w_mean":6.75,"extraction_score_mean":6.75,"stem_score_w_mean":8.2,"stem_score_mean":8.2,"humanities_score_w_mean":8.3,"humanities_score_mean":8.3,"persian_general_knowledge_score_w_mean":2.16,"persian_general_knowledge_score_mean":2.1851851852,"chatbot_rag_score_w_mean":9.3,"chatbot_rag_score_mean":9.3333333333}
         | 
| 23 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https_google.com","parameters_count":"109000000000","source_type":"Open-Source","score_w_mean":7.3142857143,"score_mean":7.4175,"writing_score_w_mean":7.5925925926,"writing_score_mean":7.575,"roleplay_score_w_mean":7.2142857143,"roleplay_score_mean":7.1833333333,"reasoning_score_w_mean":6.6,"reasoning_score_mean":6.5916666667,"math_score_w_mean":8.3043478261,"math_score_mean":8.5083333333,"coding_score_w_mean":7.3,"coding_score_mean":7.3,"extraction_score_w_mean":8.25,"extraction_score_mean":8.25,"stem_score_w_mean":7.75,"stem_score_mean":7.75,"humanities_score_w_mean":8.55,"humanities_score_mean":8.55,"persian_general_knowledge_score_w_mean":3.1111111111,"persian_general_knowledge_score_mean":3.4333333333,"chatbot_rag_score_w_mean":9.1666666667,"chatbot_rag_score_mean":9.0333333333}
         | 
| 24 | 
             
            {"Model Name":"gpt-4.1-nano","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","score_w_mean":7.2367346939,"score_mean":7.3633333333,"writing_score_w_mean":7.7407407407,"writing_score_mean":7.6666666667,"roleplay_score_w_mean":7.6428571429,"roleplay_score_mean":7.5416666667,"reasoning_score_w_mean":5.7,"reasoning_score_mean":6.0416666667,"math_score_w_mean":8.1304347826,"math_score_mean":8.25,"coding_score_w_mean":8.05,"coding_score_mean":8.05,"extraction_score_w_mean":5.95,"extraction_score_mean":5.95,"stem_score_w_mean":7.85,"stem_score_mean":7.85,"humanities_score_w_mean":8.7,"humanities_score_mean":8.7,"persian_general_knowledge_score_w_mean":3.9259259259,"persian_general_knowledge_score_mean":4.3833333333,"chatbot_rag_score_w_mean":9.1666666667,"chatbot_rag_score_mean":9.2}
         | 
| 25 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https_google.com","parameters_count":"24000000000","source_type":"Open-Source","score_w_mean":7.2448979592,"score_mean":7.2908333333,"writing_score_w_mean":7.2592592593,"writing_score_mean":7.2333333333,"roleplay_score_w_mean":6.8214285714,"roleplay_score_mean":6.6666666667,"reasoning_score_w_mean":6.3333333333,"reasoning_score_mean":6.2,"math_score_w_mean":8.5217391304,"math_score_mean":8.3,"coding_score_w_mean":7.6,"coding_score_mean":7.6,"extraction_score_w_mean":7.95,"extraction_score_mean":7.95,"stem_score_w_mean":7.3,"stem_score_mean":7.3,"humanities_score_w_mean":8.7,"humanities_score_mean":8.7,"persian_general_knowledge_score_w_mean":3.1481481481,"persian_general_knowledge_score_mean":3.4583333333,"chatbot_rag_score_w_mean":9.5333333333,"chatbot_rag_score_mean":9.5}
         | 
| 26 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https_google.com","parameters_count":"14800000000","source_type":"Open-Source","score_w_mean":7.1769547325,"score_mean":7.2045454545,"writing_score_w_mean":7.2222222222,"writing_score_mean":7.2,"roleplay_score_w_mean":7.3214285714,"roleplay_score_mean":7.2583333333,"reasoning_score_w_mean":7.3666666667,"reasoning_score_mean":7.2833333333,"math_score_w_mean":8.3913043478,"math_score_mean":8.325,"coding_score_w_mean":6.7,"coding_score_mean":6.7,"extraction_score_w_mean":7.05,"extraction_score_mean":7.05,"stem_score_w_mean":8.5,"stem_score_mean":8.5,"humanities_score_w_mean":8.7222222222,"humanities_score_mean":8.7222222222,"persian_general_knowledge_score_w_mean":1.6666666667,"persian_general_knowledge_score_mean":1.7333333333,"chatbot_rag_score_w_mean":9.4333333333,"chatbot_rag_score_mean":9.425}
         | 
    	
        leaderboard/boards_data/ner_arman.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","ner_arman_f1_mean":0.578306047,"ner_arman_precision_mean":0.5583631307,"ner_arman_recall_mean":0.6250099325,"nlu_score":0.7143086066}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","ner_arman_f1_mean":0.3839211973,"ner_arman_precision_mean":0.3292326466,"ner_arman_recall_mean":0.5049662296,"nlu_score":0.6241793507}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","ner_arman_f1_mean":0.0031613599,"ner_arman_precision_mean":0.0024235201,"ner_arman_recall_mean":0.0047675805,"nlu_score":0.6297634971}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","ner_arman_f1_mean":0.5030535945,"ner_arman_precision_mean":0.4617288155,"ner_arman_recall_mean":0.5952522845,"nlu_score":0.6552152029}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","ner_arman_f1_mean":0.3097820535,"ner_arman_precision_mean":0.2833333333,"ner_arman_recall_mean":0.3710568137,"nlu_score":0.6758278127}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","ner_arman_f1_mean":null,"ner_arman_precision_mean":null,"ner_arman_recall_mean":null,"nlu_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","ner_arman_f1_mean":0.5091463761,"ner_arman_precision_mean":0.4719705999,"ner_arman_recall_mean":0.5898887565,"nlu_score":0.6898261633}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","ner_arman_f1_mean":0.492138652,"ner_arman_precision_mean":0.4553833929,"ner_arman_recall_mean":0.5783671037,"nlu_score":0.6460328733}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","ner_arman_f1_mean":0.4408498401,"ner_arman_precision_mean":0.4206197855,"ner_arman_recall_mean":0.487067938,"nlu_score":0.6714091535}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","ner_arman_f1_mean":0.0134154417,"ner_arman_precision_mean":0.0131505761,"ner_arman_recall_mean":0.0147993643,"nlu_score":0.3749414991}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","ner_arman_f1_mean":0.028185021,"ner_arman_precision_mean":0.0278440732,"ner_arman_recall_mean":0.0304295943,"nlu_score":0.5661558794}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","ner_arman_f1_mean":0.1404403172,"ner_arman_precision_mean":0.1243629037,"ner_arman_recall_mean":0.1826181963,"nlu_score":0.456845738}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","ner_arman_f1_mean":0.578306047,"ner_arman_precision_mean":0.5583631307,"ner_arman_recall_mean":0.6250099325,"nlu_score":0.7143086066}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","ner_arman_f1_mean":0.1239012808,"ner_arman_precision_mean":0.1171036949,"ner_arman_recall_mean":0.1388160509,"nlu_score":0.628506628}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","ner_arman_f1_mean":0.3839211973,"ner_arman_precision_mean":0.3292326466,"ner_arman_recall_mean":0.5049662296,"nlu_score":0.6241793507}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","ner_arman_f1_mean":0.0031613599,"ner_arman_precision_mean":0.0024235201,"ner_arman_recall_mean":0.0047675805,"nlu_score":0.6297634971}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","ner_arman_f1_mean":0.5087496797,"ner_arman_precision_mean":0.4749602702,"ner_arman_recall_mean":0.5891338896,"nlu_score":0.7144353486}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","ner_arman_f1_mean":0.5238146835,"ner_arman_precision_mean":0.511958681,"ner_arman_recall_mean":0.5638855781,"nlu_score":0.6749652797}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","ner_arman_f1_mean":0.1833647216,"ner_arman_precision_mean":0.1720756002,"ner_arman_recall_mean":0.2118990862,"nlu_score":0.6552939868}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","ner_arman_f1_mean":0.5030535945,"ner_arman_precision_mean":0.4617288155,"ner_arman_recall_mean":0.5952522845,"nlu_score":0.6552152029}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","ner_arman_f1_mean":0.3097820535,"ner_arman_precision_mean":0.2833333333,"ner_arman_recall_mean":0.3710568137,"nlu_score":0.6758278127}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","ner_arman_f1_mean":null,"ner_arman_precision_mean":null,"ner_arman_recall_mean":null,"nlu_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","ner_arman_f1_mean":0.5091463761,"ner_arman_precision_mean":0.4719705999,"ner_arman_recall_mean":0.5898887565,"nlu_score":0.6898261633}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","ner_arman_f1_mean":0.492138652,"ner_arman_precision_mean":0.4553833929,"ner_arman_recall_mean":0.5783671037,"nlu_score":0.6460328733}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","ner_arman_f1_mean":0.4408498401,"ner_arman_precision_mean":0.4206197855,"ner_arman_recall_mean":0.487067938,"nlu_score":0.6714091535}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","ner_arman_f1_mean":0.1349481402,"ner_arman_precision_mean":0.1235087122,"ner_arman_recall_mean":0.1586809694,"nlu_score":0.4086928082}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","ner_arman_f1_mean":0.0134154417,"ner_arman_precision_mean":0.0131505761,"ner_arman_recall_mean":0.0147993643,"nlu_score":0.3749414991}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","ner_arman_f1_mean":0.028185021,"ner_arman_precision_mean":0.0278440732,"ner_arman_recall_mean":0.0304295943,"nlu_score":0.5661558794}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","ner_arman_f1_mean":0.1404403172,"ner_arman_precision_mean":0.1243629037,"ner_arman_recall_mean":0.1826181963,"nlu_score":0.456845738}
         | 
    	
        leaderboard/boards_data/nli_farstail.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","nli_farstail_acc_modified":0.868286445,"nli_farstail_precision_modified":0.8795611895,"nli_farstail_recall_modified":0.8694171245,"nli_farstail_fscore_modified":0.8680818161,"nli_farstail_acc":0.868286445,"nli_farstail_precision":0.8795611895,"nli_farstail_recall":0.8694171245,"nli_farstail_fscore":0.8680818161,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","nli_farstail_acc_modified":0.6361892583,"nli_farstail_precision_modified":0.6743240456,"nli_farstail_recall_modified":0.6374538968,"nli_farstail_fscore_modified":0.621131875,"nli_farstail_acc":0.6370038412,"nli_farstail_precision":0.6751874567,"nli_farstail_recall":0.638270099,"nli_farstail_fscore":0.6219271782,"nli_farstail_valid_output_ratio":0.9987212276,"nlu_score":0.6241793507}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","nli_farstail_acc_modified":0.6898976982,"nli_farstail_precision_modified":0.752223151,"nli_farstail_recall_modified":0.691698665,"nli_farstail_fscore_modified":0.6834607357,"nli_farstail_acc":0.6898976982,"nli_farstail_precision":0.752223151,"nli_farstail_recall":0.691698665,"nli_farstail_fscore":0.6834607357,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","nli_farstail_acc_modified":0.7078005115,"nli_farstail_precision_modified":0.7418983007,"nli_farstail_recall_modified":0.70995102,"nli_farstail_fscore_modified":0.6987179454,"nli_farstail_acc":0.7091607944,"nli_farstail_precision":0.7433241143,"nli_farstail_recall":0.7113154358,"nli_farstail_fscore":0.700060773,"nli_farstail_valid_output_ratio":0.9980818414,"nlu_score":0.6552152029}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","nli_farstail_acc_modified":0.8069053708,"nli_farstail_precision_modified":0.8274480721,"nli_farstail_recall_modified":0.8078020735,"nli_farstail_fscore_modified":0.8055860349,"nli_farstail_acc":0.8069053708,"nli_farstail_precision":0.8274480721,"nli_farstail_recall":0.8078020735,"nli_farstail_fscore":0.8055860349,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","nli_farstail_acc_modified":null,"nli_farstail_precision_modified":null,"nli_farstail_recall_modified":null,"nli_farstail_fscore_modified":null,"nli_farstail_acc":null,"nli_farstail_precision":null,"nli_farstail_recall":null,"nli_farstail_fscore":null,"nli_farstail_valid_output_ratio":null,"nlu_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","nli_farstail_acc_modified":0.6918158568,"nli_farstail_precision_modified":0.76120773,"nli_farstail_recall_modified":0.696633339,"nli_farstail_fscore_modified":0.6637995215,"nli_farstail_acc":0.6918158568,"nli_farstail_precision":0.76120773,"nli_farstail_recall":0.696633339,"nli_farstail_fscore":0.6637995215,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","nli_farstail_acc_modified":0.7007672634,"nli_farstail_precision_modified":0.7596784307,"nli_farstail_recall_modified":0.7039816989,"nli_farstail_fscore_modified":0.6834876952,"nli_farstail_acc":0.7007672634,"nli_farstail_precision":0.7596784307,"nli_farstail_recall":0.7039816989,"nli_farstail_fscore":0.6834876952,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","nli_farstail_acc_modified":0.716112532,"nli_farstail_precision_modified":0.7794942647,"nli_farstail_recall_modified":0.7185458002,"nli_farstail_fscore_modified":0.7094139725,"nli_farstail_acc":0.716112532,"nli_farstail_precision":0.7794942647,"nli_farstail_recall":0.7185458002,"nli_farstail_fscore":0.7094139725,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","nli_farstail_acc_modified":0.0249360614,"nli_farstail_precision_modified":0.0160900081,"nli_farstail_recall_modified":0.0174126172,"nli_farstail_fscore_modified":0.0167242212,"nli_farstail_acc":0.9069767442,"nli_farstail_precision":0.5852272727,"nli_farstail_recall":0.6333333333,"nli_farstail_fscore":0.6082949309,"nli_farstail_valid_output_ratio":0.0274936061,"nlu_score":0.3749414991}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","nli_farstail_acc_modified":0.7461636829,"nli_farstail_precision_modified":0.8279044878,"nli_farstail_recall_modified":0.7431719278,"nli_farstail_fscore_modified":0.7484099134,"nli_farstail_acc":0.7461636829,"nli_farstail_precision":0.8279044878,"nli_farstail_recall":0.7431719278,"nli_farstail_fscore":0.7484099134,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.5661558794}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","nli_farstail_acc_modified":0.618286445,"nli_farstail_precision_modified":0.6499905475,"nli_farstail_recall_modified":0.6180562888,"nli_farstail_fscore_modified":0.612547215,"nli_farstail_acc":0.6254851229,"nli_farstail_precision":0.6575583547,"nli_farstail_recall":0.625252287,"nli_farstail_fscore":0.6196790713,"nli_farstail_valid_output_ratio":0.9884910486,"nlu_score":0.456845738}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","nli_farstail_acc_modified":0.868286445,"nli_farstail_precision_modified":0.8795611895,"nli_farstail_recall_modified":0.8694171245,"nli_farstail_fscore_modified":0.8680818161,"nli_farstail_acc":0.868286445,"nli_farstail_precision":0.8795611895,"nli_farstail_recall":0.8694171245,"nli_farstail_fscore":0.8680818161,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","nli_farstail_acc_modified":0.7384910486,"nli_farstail_precision_modified":0.7662350641,"nli_farstail_recall_modified":0.7395626513,"nli_farstail_fscore_modified":0.7354972179,"nli_farstail_acc":0.7399103139,"nli_farstail_precision":0.7677076491,"nli_farstail_recall":0.7409839761,"nli_farstail_fscore":0.7369107296,"nli_farstail_valid_output_ratio":0.9980818414,"nlu_score":0.628506628}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","nli_farstail_acc_modified":0.6361892583,"nli_farstail_precision_modified":0.6743240456,"nli_farstail_recall_modified":0.6374538968,"nli_farstail_fscore_modified":0.621131875,"nli_farstail_acc":0.6370038412,"nli_farstail_precision":0.6751874567,"nli_farstail_recall":0.638270099,"nli_farstail_fscore":0.6219271782,"nli_farstail_valid_output_ratio":0.9987212276,"nlu_score":0.6241793507}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","nli_farstail_acc_modified":0.6898976982,"nli_farstail_precision_modified":0.752223151,"nli_farstail_recall_modified":0.691698665,"nli_farstail_fscore_modified":0.6834607357,"nli_farstail_acc":0.6898976982,"nli_farstail_precision":0.752223151,"nli_farstail_recall":0.691698665,"nli_farstail_fscore":0.6834607357,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","nli_farstail_acc_modified":0.8542199488,"nli_farstail_precision_modified":0.8634293173,"nli_farstail_recall_modified":0.8539318442,"nli_farstail_fscore_modified":0.8536753404,"nli_farstail_acc":0.8553137004,"nli_farstail_precision":0.8645348606,"nli_farstail_recall":0.8550252268,"nli_farstail_fscore":0.8547683946,"nli_farstail_valid_output_ratio":0.9987212276,"nlu_score":0.7144353486}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","nli_farstail_acc_modified":0.7653452685,"nli_farstail_precision_modified":0.7847248212,"nli_farstail_recall_modified":0.7659002614,"nli_farstail_fscore_modified":0.7629523234,"nli_farstail_acc":0.7653452685,"nli_farstail_precision":0.7847248212,"nli_farstail_recall":0.7659002614,"nli_farstail_fscore":0.7629523234,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6749652797}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"120000000000","source_type":"Open-Source","nli_farstail_acc_modified":0.7608695652,"nli_farstail_precision_modified":0.7778206934,"nli_farstail_recall_modified":0.762421143,"nli_farstail_fscore_modified":0.7569520417,"nli_farstail_acc":0.7608695652,"nli_farstail_precision":0.7778206934,"nli_farstail_recall":0.762421143,"nli_farstail_fscore":0.7569520417,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6552939868}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","nli_farstail_acc_modified":0.7078005115,"nli_farstail_precision_modified":0.7418983007,"nli_farstail_recall_modified":0.70995102,"nli_farstail_fscore_modified":0.6987179454,"nli_farstail_acc":0.7091607944,"nli_farstail_precision":0.7433241143,"nli_farstail_recall":0.7113154358,"nli_farstail_fscore":0.700060773,"nli_farstail_valid_output_ratio":0.9980818414,"nlu_score":0.6552152029}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","nli_farstail_acc_modified":0.8069053708,"nli_farstail_precision_modified":0.8274480721,"nli_farstail_recall_modified":0.8078020735,"nli_farstail_fscore_modified":0.8055860349,"nli_farstail_acc":0.8069053708,"nli_farstail_precision":0.8274480721,"nli_farstail_recall":0.8078020735,"nli_farstail_fscore":0.8055860349,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","nli_farstail_acc_modified":null,"nli_farstail_precision_modified":null,"nli_farstail_recall_modified":null,"nli_farstail_fscore_modified":null,"nli_farstail_acc":null,"nli_farstail_precision":null,"nli_farstail_recall":null,"nli_farstail_fscore":null,"nli_farstail_valid_output_ratio":null,"nlu_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","nli_farstail_acc_modified":0.6918158568,"nli_farstail_precision_modified":0.76120773,"nli_farstail_recall_modified":0.696633339,"nli_farstail_fscore_modified":0.6637995215,"nli_farstail_acc":0.6918158568,"nli_farstail_precision":0.76120773,"nli_farstail_recall":0.696633339,"nli_farstail_fscore":0.6637995215,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","nli_farstail_acc_modified":0.7007672634,"nli_farstail_precision_modified":0.7596784307,"nli_farstail_recall_modified":0.7039816989,"nli_farstail_fscore_modified":0.6834876952,"nli_farstail_acc":0.7007672634,"nli_farstail_precision":0.7596784307,"nli_farstail_recall":0.7039816989,"nli_farstail_fscore":0.6834876952,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","nli_farstail_acc_modified":0.716112532,"nli_farstail_precision_modified":0.7794942647,"nli_farstail_recall_modified":0.7185458002,"nli_farstail_fscore_modified":0.7094139725,"nli_farstail_acc":0.716112532,"nli_farstail_precision":0.7794942647,"nli_farstail_recall":0.7185458002,"nli_farstail_fscore":0.7094139725,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","nli_farstail_acc_modified":0.6822250639,"nli_farstail_precision_modified":0.7615681175,"nli_farstail_recall_modified":0.6809278738,"nli_farstail_fscore_modified":0.6476118203,"nli_farstail_acc":0.7033618985,"nli_farstail_precision":0.7851631746,"nli_farstail_recall":0.7020245185,"nli_farstail_fscore":0.6676762603,"nli_farstail_valid_output_ratio":0.9699488491,"nlu_score":0.4086928082}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","nli_farstail_acc_modified":0.0249360614,"nli_farstail_precision_modified":0.0160900081,"nli_farstail_recall_modified":0.0174126172,"nli_farstail_fscore_modified":0.0167242212,"nli_farstail_acc":0.9069767442,"nli_farstail_precision":0.5852272727,"nli_farstail_recall":0.6333333333,"nli_farstail_fscore":0.6082949309,"nli_farstail_valid_output_ratio":0.0274936061,"nlu_score":0.3749414991}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","nli_farstail_acc_modified":0.7461636829,"nli_farstail_precision_modified":0.8279044878,"nli_farstail_recall_modified":0.7431719278,"nli_farstail_fscore_modified":0.7484099134,"nli_farstail_acc":0.7461636829,"nli_farstail_precision":0.8279044878,"nli_farstail_recall":0.7431719278,"nli_farstail_fscore":0.7484099134,"nli_farstail_valid_output_ratio":1.0,"nlu_score":0.5661558794}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","nli_farstail_acc_modified":0.618286445,"nli_farstail_precision_modified":0.6499905475,"nli_farstail_recall_modified":0.6180562888,"nli_farstail_fscore_modified":0.612547215,"nli_farstail_acc":0.6254851229,"nli_farstail_precision":0.6575583547,"nli_farstail_recall":0.625252287,"nli_farstail_fscore":0.6196790713,"nli_farstail_valid_output_ratio":0.9884910486,"nlu_score":0.456845738}
         | 
    	
        leaderboard/boards_data/paraphrase-detection_FarsiParaphraseDetection.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.877394636,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9117647059,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8567164179,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8679892098,"paraphrase-detection_FarsiParaphraseDetection_acc":0.877394636,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9117647059,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8567164179,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8679892098,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8697318008,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9057190558,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8481376599,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8593214965,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8697318008,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9057190558,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8481376599,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8593214965,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6241793507}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8901660281,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9194756554,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.871641791,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8825816756,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8901660281,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9194756554,"paraphrase-detection_FarsiParaphraseDetection_recall":0.871641791,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8825816756,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8901660281,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9194756554,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.871641791,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8825816756,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8901660281,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9194756554,"paraphrase-detection_FarsiParaphraseDetection_recall":0.871641791,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8825816756,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6552152029}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8595146871,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9014336918,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8358208955,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8471137461,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8595146871,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9014336918,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8358208955,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8471137461,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":null,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":null,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":null,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":null,"paraphrase-detection_FarsiParaphraseDetection_acc":null,"paraphrase-detection_FarsiParaphraseDetection_precision":null,"paraphrase-detection_FarsiParaphraseDetection_recall":null,"paraphrase-detection_FarsiParaphraseDetection_fscore":null,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":null,"nlu_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.9029374202,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9262452107,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8869436301,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.897066353,"paraphrase-detection_FarsiParaphraseDetection_acc":0.9029374202,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9262452107,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8869436301,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.897066353,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8390804598,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.8902439024,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8119402985,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8225473409,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8390804598,"paraphrase-detection_FarsiParaphraseDetection_precision":0.8902439024,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8119402985,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8225473409,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8952745849,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9226415094,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8776119403,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8883498185,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8952745849,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9226415094,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8776119403,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8883498185,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8556832695,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.8960759725,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8314059789,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8433777185,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8634020619,"paraphrase-detection_FarsiParaphraseDetection_precision":0.904159132,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8389057751,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8509855072,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":0.9910600255,"nlu_score":0.3749414991}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.680715198,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.8209169054,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.6268656716,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.5933059088,"paraphrase-detection_FarsiParaphraseDetection_acc":0.680715198,"paraphrase-detection_FarsiParaphraseDetection_precision":0.8209169054,"paraphrase-detection_FarsiParaphraseDetection_recall":0.6268656716,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.5933059088,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.5661558794}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.3627075351,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.3434772816,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.3695590113,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.353505411,"paraphrase-detection_FarsiParaphraseDetection_acc":0.9220779221,"paraphrase-detection_FarsiParaphraseDetection_precision":0.8731906218,"paraphrase-detection_FarsiParaphraseDetection_recall":0.9394957983,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8986842105,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":0.3933588761,"nlu_score":0.456845738}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.877394636,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9117647059,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8567164179,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8679892098,"paraphrase-detection_FarsiParaphraseDetection_acc":0.877394636,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9117647059,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8567164179,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8679892098,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8135376756,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.8710840658,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.7844142715,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.7937868553,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8240620957,"paraphrase-detection_FarsiParaphraseDetection_precision":0.8823529412,"paraphrase-detection_FarsiParaphraseDetection_recall":0.7945619335,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8040557668,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":0.9872286079,"nlu_score":0.628506628}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8697318008,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9057190558,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8481376599,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8593214965,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8697318008,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9057190558,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8481376599,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8593214965,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6241793507}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8901660281,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9194756554,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.871641791,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8825816756,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8901660281,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9194756554,"paraphrase-detection_FarsiParaphraseDetection_recall":0.871641791,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8825816756,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8378033206,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.8876229723,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8118030537,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8221408221,"paraphrase-detection_FarsiParaphraseDetection_acc":0.841025641,"paraphrase-detection_FarsiParaphraseDetection_precision":0.8910369069,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8149253731,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8253029022,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":0.9961685824,"nlu_score":0.7144353486}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8212005109,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.880952381,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.7910447761,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8003569607,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8212005109,"paraphrase-detection_FarsiParaphraseDetection_precision":0.880952381,"paraphrase-detection_FarsiParaphraseDetection_recall":0.7910447761,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8003569607,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6749652797}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8505747126,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.896460177,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8253731343,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8364641219,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8505747126,"paraphrase-detection_FarsiParaphraseDetection_precision":0.896460177,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8253731343,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8364641219,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6552939868}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8901660281,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9194756554,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.871641791,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8825816756,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8901660281,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9194756554,"paraphrase-detection_FarsiParaphraseDetection_recall":0.871641791,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8825816756,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6552152029}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8595146871,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9014336918,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8358208955,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8471137461,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8595146871,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9014336918,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8358208955,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8471137461,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":null,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":null,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":null,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":null,"paraphrase-detection_FarsiParaphraseDetection_acc":null,"paraphrase-detection_FarsiParaphraseDetection_precision":null,"paraphrase-detection_FarsiParaphraseDetection_recall":null,"paraphrase-detection_FarsiParaphraseDetection_fscore":null,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":null,"nlu_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.9029374202,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9262452107,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8869436301,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.897066353,"paraphrase-detection_FarsiParaphraseDetection_acc":0.9029374202,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9262452107,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8869436301,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.897066353,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8390804598,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.8902439024,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8119402985,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8225473409,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8390804598,"paraphrase-detection_FarsiParaphraseDetection_precision":0.8902439024,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8119402985,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8225473409,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8952745849,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9226415094,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8776119403,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8883498185,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8952745849,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9226415094,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8776119403,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8883498185,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8965517241,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.9234404537,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8791044776,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8897859599,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8965517241,"paraphrase-detection_FarsiParaphraseDetection_precision":0.9234404537,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8791044776,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8897859599,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.4086928082}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.8556832695,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.8960759725,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.8314059789,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.8433777185,"paraphrase-detection_FarsiParaphraseDetection_acc":0.8634020619,"paraphrase-detection_FarsiParaphraseDetection_precision":0.904159132,"paraphrase-detection_FarsiParaphraseDetection_recall":0.8389057751,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8509855072,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":0.9910600255,"nlu_score":0.3749414991}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.680715198,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.8209169054,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.6268656716,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.5933059088,"paraphrase-detection_FarsiParaphraseDetection_acc":0.680715198,"paraphrase-detection_FarsiParaphraseDetection_precision":0.8209169054,"paraphrase-detection_FarsiParaphraseDetection_recall":0.6268656716,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.5933059088,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":1.0,"nlu_score":0.5661558794}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","paraphrase-detection_FarsiParaphraseDetection_acc_modified":0.3627075351,"paraphrase-detection_FarsiParaphraseDetection_precision_modified":0.3434772816,"paraphrase-detection_FarsiParaphraseDetection_recall_modified":0.3695590113,"paraphrase-detection_FarsiParaphraseDetection_fscore_modified":0.353505411,"paraphrase-detection_FarsiParaphraseDetection_acc":0.9220779221,"paraphrase-detection_FarsiParaphraseDetection_precision":0.8731906218,"paraphrase-detection_FarsiParaphraseDetection_recall":0.9394957983,"paraphrase-detection_FarsiParaphraseDetection_fscore":0.8986842105,"paraphrase-detection_FarsiParaphraseDetection_valid_output_ratio":0.3933588761,"nlu_score":0.456845738}
         | 
    	
        leaderboard/boards_data/paraphrase-detection_parsinlu.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_parsinlu_acc_modified":0.844,"paraphrase-detection_parsinlu_precision_modified":0.8671683358,"paraphrase-detection_parsinlu_recall_modified":0.8248878009,"paraphrase-detection_parsinlu_fscore_modified":0.8334216056,"paraphrase-detection_parsinlu_acc":0.844,"paraphrase-detection_parsinlu_precision":0.8671683358,"paraphrase-detection_parsinlu_recall":0.8248878009,"paraphrase-detection_parsinlu_fscore":0.8334216056,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.838,"paraphrase-detection_parsinlu_precision_modified":0.8416530278,"paraphrase-detection_parsinlu_recall_modified":0.8270501836,"paraphrase-detection_parsinlu_fscore_modified":0.8316645261,"paraphrase-detection_parsinlu_acc":0.838,"paraphrase-detection_parsinlu_precision":0.8416530278,"paraphrase-detection_parsinlu_recall":0.8270501836,"paraphrase-detection_parsinlu_fscore":0.8316645261,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6241793507}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.872,"paraphrase-detection_parsinlu_precision_modified":0.872593554,"paraphrase-detection_parsinlu_recall_modified":0.8654426765,"paraphrase-detection_parsinlu_fscore_modified":0.8682824025,"paraphrase-detection_parsinlu_acc":0.872,"paraphrase-detection_parsinlu_precision":0.872593554,"paraphrase-detection_parsinlu_recall":0.8654426765,"paraphrase-detection_parsinlu_fscore":0.8682824025,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.866,"paraphrase-detection_parsinlu_precision_modified":0.8771198269,"paraphrase-detection_parsinlu_recall_modified":0.852753978,"paraphrase-detection_parsinlu_fscore_modified":0.8595688134,"paraphrase-detection_parsinlu_acc":0.866,"paraphrase-detection_parsinlu_precision":0.8771198269,"paraphrase-detection_parsinlu_recall":0.852753978,"paraphrase-detection_parsinlu_fscore":0.8595688134,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6552152029}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_parsinlu_acc_modified":0.826,"paraphrase-detection_parsinlu_precision_modified":0.861267166,"paraphrase-detection_parsinlu_recall_modified":0.802243982,"paraphrase-detection_parsinlu_fscore_modified":0.8109673691,"paraphrase-detection_parsinlu_acc":0.826,"paraphrase-detection_parsinlu_precision":0.861267166,"paraphrase-detection_parsinlu_recall":0.802243982,"paraphrase-detection_parsinlu_fscore":0.8109673691,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_parsinlu_acc_modified":null,"paraphrase-detection_parsinlu_precision_modified":null,"paraphrase-detection_parsinlu_recall_modified":null,"paraphrase-detection_parsinlu_fscore_modified":null,"paraphrase-detection_parsinlu_acc":null,"paraphrase-detection_parsinlu_precision":null,"paraphrase-detection_parsinlu_recall":null,"paraphrase-detection_parsinlu_fscore":null,"paraphrase-detection_parsinlu_valid_output_ratio":null,"nlu_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.876,"paraphrase-detection_parsinlu_precision_modified":0.8806824921,"paraphrase-detection_parsinlu_recall_modified":0.8666666667,"paraphrase-detection_parsinlu_fscore_modified":0.871456768,"paraphrase-detection_parsinlu_acc":0.876,"paraphrase-detection_parsinlu_precision":0.8806824921,"paraphrase-detection_parsinlu_recall":0.8666666667,"paraphrase-detection_parsinlu_fscore":0.871456768,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.854,"paraphrase-detection_parsinlu_precision_modified":0.8742015099,"paraphrase-detection_parsinlu_recall_modified":0.8365157079,"paraphrase-detection_parsinlu_fscore_modified":0.8449177639,"paraphrase-detection_parsinlu_acc":0.854,"paraphrase-detection_parsinlu_precision":0.8742015099,"paraphrase-detection_parsinlu_recall":0.8365157079,"paraphrase-detection_parsinlu_fscore":0.8449177639,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.876,"paraphrase-detection_parsinlu_precision_modified":0.8735210118,"paraphrase-detection_parsinlu_recall_modified":0.8735210118,"paraphrase-detection_parsinlu_fscore_modified":0.8735210118,"paraphrase-detection_parsinlu_acc":0.876,"paraphrase-detection_parsinlu_precision":0.8735210118,"paraphrase-detection_parsinlu_recall":0.8735210118,"paraphrase-detection_parsinlu_fscore":0.8735210118,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_parsinlu_acc_modified":0.744,"paraphrase-detection_parsinlu_precision_modified":0.7517357255,"paraphrase-detection_parsinlu_recall_modified":0.7357334824,"paraphrase-detection_parsinlu_fscore_modified":0.7395,"paraphrase-detection_parsinlu_acc":0.8416289593,"paraphrase-detection_parsinlu_precision":0.85037978,"paraphrase-detection_parsinlu_recall":0.832277695,"paraphrase-detection_parsinlu_fscore":0.8365384615,"paraphrase-detection_parsinlu_valid_output_ratio":0.884,"nlu_score":0.3749414991}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.66,"paraphrase-detection_parsinlu_precision_modified":0.7933390651,"paraphrase-detection_parsinlu_recall_modified":0.6057935537,"paraphrase-detection_parsinlu_fscore_modified":0.5625411726,"paraphrase-detection_parsinlu_acc":0.66,"paraphrase-detection_parsinlu_precision":0.7933390651,"paraphrase-detection_parsinlu_recall":0.6057935537,"paraphrase-detection_parsinlu_fscore":0.5625411726,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.5661558794}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.274,"paraphrase-detection_parsinlu_precision_modified":0.2627667984,"paraphrase-detection_parsinlu_recall_modified":0.2313142857,"paraphrase-detection_parsinlu_fscore_modified":0.2414462011,"paraphrase-detection_parsinlu_acc":0.85625,"paraphrase-detection_parsinlu_precision":0.8211462451,"paraphrase-detection_parsinlu_recall":0.7228571429,"paraphrase-detection_parsinlu_fscore":0.7545193783,"paraphrase-detection_parsinlu_valid_output_ratio":0.32,"nlu_score":0.456845738}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_parsinlu_acc_modified":0.844,"paraphrase-detection_parsinlu_precision_modified":0.8671683358,"paraphrase-detection_parsinlu_recall_modified":0.8248878009,"paraphrase-detection_parsinlu_fscore_modified":0.8334216056,"paraphrase-detection_parsinlu_acc":0.844,"paraphrase-detection_parsinlu_precision":0.8671683358,"paraphrase-detection_parsinlu_recall":0.8248878009,"paraphrase-detection_parsinlu_fscore":0.8334216056,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.796,"paraphrase-detection_parsinlu_precision_modified":0.8275307297,"paraphrase-detection_parsinlu_recall_modified":0.7707807282,"paraphrase-detection_parsinlu_fscore_modified":0.7792394123,"paraphrase-detection_parsinlu_acc":0.8139059305,"paraphrase-detection_parsinlu_precision":0.8461459404,"paraphrase-detection_parsinlu_recall":0.788119354,"paraphrase-detection_parsinlu_fscore":0.7967683152,"paraphrase-detection_parsinlu_valid_output_ratio":0.978,"nlu_score":0.628506628}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.838,"paraphrase-detection_parsinlu_precision_modified":0.8416530278,"paraphrase-detection_parsinlu_recall_modified":0.8270501836,"paraphrase-detection_parsinlu_fscore_modified":0.8316645261,"paraphrase-detection_parsinlu_acc":0.838,"paraphrase-detection_parsinlu_precision":0.8416530278,"paraphrase-detection_parsinlu_recall":0.8270501836,"paraphrase-detection_parsinlu_fscore":0.8316645261,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6241793507}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.872,"paraphrase-detection_parsinlu_precision_modified":0.872593554,"paraphrase-detection_parsinlu_recall_modified":0.8654426765,"paraphrase-detection_parsinlu_fscore_modified":0.8682824025,"paraphrase-detection_parsinlu_acc":0.872,"paraphrase-detection_parsinlu_precision":0.872593554,"paraphrase-detection_parsinlu_recall":0.8654426765,"paraphrase-detection_parsinlu_fscore":0.8682824025,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_parsinlu_acc_modified":0.812,"paraphrase-detection_parsinlu_precision_modified":0.8560421519,"paraphrase-detection_parsinlu_recall_modified":0.7853480321,"paraphrase-detection_parsinlu_fscore_modified":0.7936411239,"paraphrase-detection_parsinlu_acc":0.8152610442,"paraphrase-detection_parsinlu_precision":0.8594800722,"paraphrase-detection_parsinlu_recall":0.7885020403,"paraphrase-detection_parsinlu_fscore":0.7968284376,"paraphrase-detection_parsinlu_valid_output_ratio":0.996,"nlu_score":0.7144353486}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_parsinlu_acc_modified":0.78,"paraphrase-detection_parsinlu_precision_modified":0.8453499806,"paraphrase-detection_parsinlu_recall_modified":0.7464708282,"paraphrase-detection_parsinlu_fscore_modified":0.7504718351,"paraphrase-detection_parsinlu_acc":0.78,"paraphrase-detection_parsinlu_precision":0.8453499806,"paraphrase-detection_parsinlu_recall":0.7464708282,"paraphrase-detection_parsinlu_fscore":0.7504718351,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6749652797}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.814,"paraphrase-detection_parsinlu_precision_modified":0.8536111778,"paraphrase-detection_parsinlu_recall_modified":0.7882904937,"paraphrase-detection_parsinlu_fscore_modified":0.7964017847,"paraphrase-detection_parsinlu_acc":0.814,"paraphrase-detection_parsinlu_precision":0.8536111778,"paraphrase-detection_parsinlu_recall":0.7882904937,"paraphrase-detection_parsinlu_fscore":0.7964017847,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6552939868}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.866,"paraphrase-detection_parsinlu_precision_modified":0.8771198269,"paraphrase-detection_parsinlu_recall_modified":0.852753978,"paraphrase-detection_parsinlu_fscore_modified":0.8595688134,"paraphrase-detection_parsinlu_acc":0.866,"paraphrase-detection_parsinlu_precision":0.8771198269,"paraphrase-detection_parsinlu_recall":0.852753978,"paraphrase-detection_parsinlu_fscore":0.8595688134,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6552152029}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_parsinlu_acc_modified":0.826,"paraphrase-detection_parsinlu_precision_modified":0.861267166,"paraphrase-detection_parsinlu_recall_modified":0.802243982,"paraphrase-detection_parsinlu_fscore_modified":0.8109673691,"paraphrase-detection_parsinlu_acc":0.826,"paraphrase-detection_parsinlu_precision":0.861267166,"paraphrase-detection_parsinlu_recall":0.802243982,"paraphrase-detection_parsinlu_fscore":0.8109673691,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_parsinlu_acc_modified":null,"paraphrase-detection_parsinlu_precision_modified":null,"paraphrase-detection_parsinlu_recall_modified":null,"paraphrase-detection_parsinlu_fscore_modified":null,"paraphrase-detection_parsinlu_acc":null,"paraphrase-detection_parsinlu_precision":null,"paraphrase-detection_parsinlu_recall":null,"paraphrase-detection_parsinlu_fscore":null,"paraphrase-detection_parsinlu_valid_output_ratio":null,"nlu_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.876,"paraphrase-detection_parsinlu_precision_modified":0.8806824921,"paraphrase-detection_parsinlu_recall_modified":0.8666666667,"paraphrase-detection_parsinlu_fscore_modified":0.871456768,"paraphrase-detection_parsinlu_acc":0.876,"paraphrase-detection_parsinlu_precision":0.8806824921,"paraphrase-detection_parsinlu_recall":0.8666666667,"paraphrase-detection_parsinlu_fscore":0.871456768,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.854,"paraphrase-detection_parsinlu_precision_modified":0.8742015099,"paraphrase-detection_parsinlu_recall_modified":0.8365157079,"paraphrase-detection_parsinlu_fscore_modified":0.8449177639,"paraphrase-detection_parsinlu_acc":0.854,"paraphrase-detection_parsinlu_precision":0.8742015099,"paraphrase-detection_parsinlu_recall":0.8365157079,"paraphrase-detection_parsinlu_fscore":0.8449177639,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.876,"paraphrase-detection_parsinlu_precision_modified":0.8735210118,"paraphrase-detection_parsinlu_recall_modified":0.8735210118,"paraphrase-detection_parsinlu_fscore_modified":0.8735210118,"paraphrase-detection_parsinlu_acc":0.876,"paraphrase-detection_parsinlu_precision":0.8735210118,"paraphrase-detection_parsinlu_recall":0.8735210118,"paraphrase-detection_parsinlu_fscore":0.8735210118,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.86,"paraphrase-detection_parsinlu_precision_modified":0.8618019568,"paraphrase-detection_parsinlu_recall_modified":0.8516299393,"paraphrase-detection_parsinlu_fscore_modified":0.8553599196,"paraphrase-detection_parsinlu_acc":0.8617234469,"paraphrase-detection_parsinlu_precision":0.8635290148,"paraphrase-detection_parsinlu_recall":0.8533366126,"paraphrase-detection_parsinlu_fscore":0.8570740678,"paraphrase-detection_parsinlu_valid_output_ratio":0.998,"nlu_score":0.4086928082}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","paraphrase-detection_parsinlu_acc_modified":0.744,"paraphrase-detection_parsinlu_precision_modified":0.7517357255,"paraphrase-detection_parsinlu_recall_modified":0.7357334824,"paraphrase-detection_parsinlu_fscore_modified":0.7395,"paraphrase-detection_parsinlu_acc":0.8416289593,"paraphrase-detection_parsinlu_precision":0.85037978,"paraphrase-detection_parsinlu_recall":0.832277695,"paraphrase-detection_parsinlu_fscore":0.8365384615,"paraphrase-detection_parsinlu_valid_output_ratio":0.884,"nlu_score":0.3749414991}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.66,"paraphrase-detection_parsinlu_precision_modified":0.7933390651,"paraphrase-detection_parsinlu_recall_modified":0.6057935537,"paraphrase-detection_parsinlu_fscore_modified":0.5625411726,"paraphrase-detection_parsinlu_acc":0.66,"paraphrase-detection_parsinlu_precision":0.7933390651,"paraphrase-detection_parsinlu_recall":0.6057935537,"paraphrase-detection_parsinlu_fscore":0.5625411726,"paraphrase-detection_parsinlu_valid_output_ratio":1.0,"nlu_score":0.5661558794}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","paraphrase-detection_parsinlu_acc_modified":0.274,"paraphrase-detection_parsinlu_precision_modified":0.2627667984,"paraphrase-detection_parsinlu_recall_modified":0.2313142857,"paraphrase-detection_parsinlu_fscore_modified":0.2414462011,"paraphrase-detection_parsinlu_acc":0.85625,"paraphrase-detection_parsinlu_precision":0.8211462451,"paraphrase-detection_parsinlu_recall":0.7228571429,"paraphrase-detection_parsinlu_fscore":0.7545193783,"paraphrase-detection_parsinlu_valid_output_ratio":0.32,"nlu_score":0.456845738}
         | 
    	
        leaderboard/boards_data/persian_csr.jsonl
    CHANGED
    
    | @@ -4,6 +4,7 @@ | |
| 4 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8839,"acc_strict":0.8839,"donyaeeqtesad_acc":0.8610271903,"isna_acc":0.8359375,"ninisite_article_acc":0.8702702703,"virgool_4_acc":0.9033232628,"khabaronline_acc":0.884,"digiato_acc":0.8705636743,"doctoreto_acc":0.885,"sarzamindownload_acc":0.8562091503,"hamgardi_acc":0.8377581121,"bigbangpage_acc":0.923566879,"wiki_ahlolbait_acc":0.9276315789,"virgool_3_acc":0.9104477612,"virgool_2_acc":0.8837920489,"virgool_1_acc":0.8607594937,"hamshahrionline_acc":0.9114754098,"tabnak_acc":0.887966805,"alibaba_acc":0.9117647059,"digikala_mag_acc":0.9118236473,"yjc_acc":0.867816092,"beytoote_acc":0.91966759,"asriran_acc":0.8792270531,"ecoiran_acc":0.8634920635,"hawzah_acc":0.9269662921,"zoomit_acc":0.9154929577,"wikipedia_acc":0.9428571429,"namnak_acc":0.8583106267,"khodro45_acc":0.8602941176,"fidibo_acc":0.9074889868,"newmiind_acc":0.8020833333,"taaghche_acc":0.8974358974,"motamem_acc":0.9263157895,"varzesh3_acc":0.9096989967,"mehrnews_acc":0.8508064516,"tasnim_acc":0.8307692308,"magerta_acc":0.8403361345,"radiokodak_book_acc":0.8695652174,"vipofilm_acc":1.0,"wikishia_acc":1.0,"voolak_acc":0.8837209302,"farsroid_acc":0.8421052632,"parsiday_acc":0.8833333333,"soft98_acc":0.9,"ninisite_discussion_acc":0.9}
         | 
| 5 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8717,"acc_strict":0.8714,"donyaeeqtesad_acc":0.8700906344,"isna_acc":0.8671875,"ninisite_article_acc":0.8621621622,"virgool_4_acc":0.9033232628,"khabaronline_acc":0.852,"digiato_acc":0.8747390397,"doctoreto_acc":0.9,"sarzamindownload_acc":0.8562091503,"hamgardi_acc":0.8230088496,"bigbangpage_acc":0.898089172,"wiki_ahlolbait_acc":0.8881578947,"virgool_3_acc":0.9104477612,"virgool_2_acc":0.8929663609,"virgool_1_acc":0.8765822785,"hamshahrionline_acc":0.8786885246,"tabnak_acc":0.8755186722,"alibaba_acc":0.9183006536,"digikala_mag_acc":0.8977955912,"yjc_acc":0.8563218391,"beytoote_acc":0.8864265928,"asriran_acc":0.8212560386,"ecoiran_acc":0.8476190476,"hawzah_acc":0.8960674157,"zoomit_acc":0.9084507042,"wikipedia_acc":0.9238095238,"namnak_acc":0.8310626703,"khodro45_acc":0.8382352941,"fidibo_acc":0.9207048458,"newmiind_acc":0.8194444444,"taaghche_acc":0.9038461538,"motamem_acc":0.9368421053,"varzesh3_acc":0.8829431438,"mehrnews_acc":0.8064516129,"tasnim_acc":0.8692307692,"magerta_acc":0.7605042017,"radiokodak_book_acc":0.8260869565,"vipofilm_acc":0.9230769231,"wikishia_acc":0.9393939394,"voolak_acc":0.8372093023,"farsroid_acc":0.7894736842,"parsiday_acc":0.775,"soft98_acc":0.9,"ninisite_discussion_acc":0.8}
         | 
| 6 | 
             
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8665,"acc_strict":0.7832,"donyaeeqtesad_acc":0.8459214502,"isna_acc":0.8359375,"ninisite_article_acc":0.8594594595,"virgool_4_acc":0.8882175227,"khabaronline_acc":0.896,"digiato_acc":0.8496868476,"doctoreto_acc":0.855,"sarzamindownload_acc":0.8235294118,"hamgardi_acc":0.8200589971,"bigbangpage_acc":0.9171974522,"wiki_ahlolbait_acc":0.9342105263,"virgool_3_acc":0.8656716418,"virgool_2_acc":0.8837920489,"virgool_1_acc":0.8892405063,"hamshahrionline_acc":0.9409836066,"tabnak_acc":0.887966805,"alibaba_acc":0.8529411765,"digikala_mag_acc":0.8817635271,"yjc_acc":0.8103448276,"beytoote_acc":0.8891966759,"asriran_acc":0.8550724638,"ecoiran_acc":0.8126984127,"hawzah_acc":0.9129213483,"zoomit_acc":0.9084507042,"wikipedia_acc":0.9285714286,"namnak_acc":0.8446866485,"khodro45_acc":0.8455882353,"fidibo_acc":0.872246696,"newmiind_acc":0.8125,"taaghche_acc":0.9038461538,"motamem_acc":0.9157894737,"varzesh3_acc":0.8996655518,"mehrnews_acc":0.814516129,"tasnim_acc":0.8461538462,"magerta_acc":0.781512605,"radiokodak_book_acc":0.7826086957,"vipofilm_acc":0.9230769231,"wikishia_acc":0.9696969697,"voolak_acc":0.7674418605,"farsroid_acc":0.7105263158,"parsiday_acc":0.85,"soft98_acc":0.8,"ninisite_discussion_acc":0.9}
         | 
|  | |
| 7 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8637863786,"acc_strict":0.8637863786,"donyaeeqtesad_acc":0.8398791541,"isna_acc":0.828125,"ninisite_article_acc":0.8243243243,"virgool_4_acc":0.8851963746,"khabaronline_acc":0.84,"digiato_acc":0.8747390397,"doctoreto_acc":0.895,"sarzamindownload_acc":0.8366013072,"hamgardi_acc":0.802359882,"bigbangpage_acc":0.898089172,"wiki_ahlolbait_acc":0.9407894737,"virgool_3_acc":0.8955223881,"virgool_2_acc":0.8899082569,"virgool_1_acc":0.8892405063,"hamshahrionline_acc":0.8754098361,"tabnak_acc":0.8755186722,"alibaba_acc":0.8426229508,"digikala_mag_acc":0.877755511,"yjc_acc":0.816091954,"beytoote_acc":0.8836565097,"asriran_acc":0.8888888889,"ecoiran_acc":0.8126984127,"hawzah_acc":0.8904494382,"zoomit_acc":0.9084507042,"wikipedia_acc":0.919047619,"namnak_acc":0.8392370572,"khodro45_acc":0.8823529412,"fidibo_acc":0.9030837004,"newmiind_acc":0.8125,"taaghche_acc":0.9423076923,"motamem_acc":0.9157894737,"varzesh3_acc":0.8929765886,"mehrnews_acc":0.8427419355,"tasnim_acc":0.8153846154,"magerta_acc":0.7773109244,"radiokodak_book_acc":0.6956521739,"vipofilm_acc":1.0,"wikishia_acc":0.9696969697,"voolak_acc":0.7441860465,"farsroid_acc":0.7894736842,"parsiday_acc":0.8166666667,"soft98_acc":1.0,"ninisite_discussion_acc":0.9}
         | 
| 8 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8551,"acc_strict":0.8551,"donyaeeqtesad_acc":0.8429003021,"isna_acc":0.828125,"ninisite_article_acc":0.8540540541,"virgool_4_acc":0.8610271903,"khabaronline_acc":0.84,"digiato_acc":0.8830897704,"doctoreto_acc":0.87,"sarzamindownload_acc":0.8758169935,"hamgardi_acc":0.796460177,"bigbangpage_acc":0.8853503185,"wiki_ahlolbait_acc":0.9013157895,"virgool_3_acc":0.871641791,"virgool_2_acc":0.9051987768,"virgool_1_acc":0.8481012658,"hamshahrionline_acc":0.8786885246,"tabnak_acc":0.8713692946,"alibaba_acc":0.8758169935,"digikala_mag_acc":0.879759519,"yjc_acc":0.7988505747,"beytoote_acc":0.8753462604,"asriran_acc":0.8260869565,"ecoiran_acc":0.8031746032,"hawzah_acc":0.8511235955,"zoomit_acc":0.8849765258,"wikipedia_acc":0.9285714286,"namnak_acc":0.8310626703,"khodro45_acc":0.8897058824,"fidibo_acc":0.872246696,"newmiind_acc":0.7881944444,"taaghche_acc":0.8974358974,"motamem_acc":0.9157894737,"varzesh3_acc":0.8762541806,"mehrnews_acc":0.8346774194,"tasnim_acc":0.8269230769,"magerta_acc":0.7941176471,"radiokodak_book_acc":0.6956521739,"vipofilm_acc":0.7692307692,"wikishia_acc":0.9393939394,"voolak_acc":0.8372093023,"farsroid_acc":0.8157894737,"parsiday_acc":0.7583333333,"soft98_acc":0.8,"ninisite_discussion_acc":0.3}
         | 
| 9 | 
             
            {"Model Name":"deepseek-reasoner","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","acc":0.825165033,"acc_strict":0.825165033,"donyaeeqtesad_acc":0.8247734139,"isna_acc":0.8046875,"ninisite_article_acc":0.8594594595,"virgool_4_acc":0.8580060423,"khabaronline_acc":0.78,"digiato_acc":0.8267223382,"doctoreto_acc":0.835,"sarzamindownload_acc":0.7908496732,"hamgardi_acc":0.808259587,"bigbangpage_acc":0.9044585987,"wiki_ahlolbait_acc":0.9006622517,"virgool_3_acc":0.8268656716,"virgool_2_acc":0.8348623853,"virgool_1_acc":0.7911392405,"hamshahrionline_acc":0.8651315789,"tabnak_acc":0.8215767635,"alibaba_acc":0.8169934641,"digikala_mag_acc":0.8336673347,"yjc_acc":0.7873563218,"beytoote_acc":0.8310249307,"asriran_acc":0.8212560386,"ecoiran_acc":0.7523809524,"hawzah_acc":0.8735955056,"zoomit_acc":0.8450704225,"wikipedia_acc":0.9,"namnak_acc":0.8337874659,"khodro45_acc":0.8088235294,"fidibo_acc":0.845814978,"newmiind_acc":0.7604166667,"taaghche_acc":0.891025641,"motamem_acc":0.8947368421,"varzesh3_acc":0.8093645485,"mehrnews_acc":0.7782258065,"tasnim_acc":0.8115384615,"magerta_acc":0.7647058824,"radiokodak_book_acc":0.6086956522,"vipofilm_acc":0.9230769231,"wikishia_acc":0.9393939394,"voolak_acc":0.8372093023,"farsroid_acc":0.7368421053,"parsiday_acc":0.7583333333,"soft98_acc":0.9,"ninisite_discussion_acc":0.7}
         | 
| @@ -11,13 +12,17 @@ | |
| 11 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8143,"acc_strict":0.8143,"donyaeeqtesad_acc":0.7975830816,"isna_acc":0.77734375,"ninisite_article_acc":0.8,"virgool_4_acc":0.833836858,"khabaronline_acc":0.796,"digiato_acc":0.8037578288,"doctoreto_acc":0.82,"sarzamindownload_acc":0.7712418301,"hamgardi_acc":0.7669616519,"bigbangpage_acc":0.8598726115,"wiki_ahlolbait_acc":0.8947368421,"virgool_3_acc":0.8298507463,"virgool_2_acc":0.8409785933,"virgool_1_acc":0.8196202532,"hamshahrionline_acc":0.8557377049,"tabnak_acc":0.8215767635,"alibaba_acc":0.8202614379,"digikala_mag_acc":0.8176352705,"yjc_acc":0.8045977011,"beytoote_acc":0.811634349,"asriran_acc":0.7874396135,"ecoiran_acc":0.7682539683,"hawzah_acc":0.8511235955,"zoomit_acc":0.8474178404,"wikipedia_acc":0.8952380952,"namnak_acc":0.7847411444,"khodro45_acc":0.8382352941,"fidibo_acc":0.845814978,"newmiind_acc":0.7708333333,"taaghche_acc":0.8525641026,"motamem_acc":0.9157894737,"varzesh3_acc":0.8394648829,"mehrnews_acc":0.7459677419,"tasnim_acc":0.8230769231,"magerta_acc":0.7478991597,"radiokodak_book_acc":0.6956521739,"vipofilm_acc":1.0,"wikishia_acc":1.0,"voolak_acc":0.7906976744,"farsroid_acc":0.7105263158,"parsiday_acc":0.7416666667,"soft98_acc":0.9,"ninisite_discussion_acc":0.6}
         | 
| 12 | 
             
            {"Model Name":"c4ai-command-a-03-2025","thinking_method":"β","model_url":"https_google.com","parameters_count":"111000000000","source_type":"Open-Source","acc":0.798859772,"acc_strict":0.7983596719,"donyaeeqtesad_acc":0.7673716012,"isna_acc":0.76953125,"ninisite_article_acc":0.7696476965,"virgool_4_acc":0.8398791541,"khabaronline_acc":0.78,"digiato_acc":0.7870563674,"doctoreto_acc":0.82,"sarzamindownload_acc":0.7712418301,"hamgardi_acc":0.7610619469,"bigbangpage_acc":0.8789808917,"wiki_ahlolbait_acc":0.8486842105,"virgool_3_acc":0.8119402985,"virgool_2_acc":0.8226299694,"virgool_1_acc":0.8037974684,"hamshahrionline_acc":0.8557377049,"tabnak_acc":0.8298755187,"alibaba_acc":0.8562091503,"digikala_mag_acc":0.8152610442,"yjc_acc":0.7471264368,"beytoote_acc":0.8005540166,"asriran_acc":0.7922705314,"ecoiran_acc":0.7333333333,"hawzah_acc":0.8342696629,"zoomit_acc":0.8427230047,"wikipedia_acc":0.9095238095,"namnak_acc":0.7738419619,"khodro45_acc":0.8088235294,"fidibo_acc":0.845814978,"newmiind_acc":0.7222222222,"taaghche_acc":0.8397435897,"motamem_acc":0.8947368421,"varzesh3_acc":0.7993311037,"mehrnews_acc":0.7338709677,"tasnim_acc":0.7730769231,"magerta_acc":0.6974789916,"radiokodak_book_acc":0.652173913,"vipofilm_acc":0.9230769231,"wikishia_acc":0.8484848485,"voolak_acc":0.7441860465,"farsroid_acc":0.6578947368,"parsiday_acc":0.7166666667,"soft98_acc":0.8,"ninisite_discussion_acc":0.6}
         | 
| 13 | 
             
            {"Model Name":"Llama-3.3-70B-Instruct","thinking_method":"β","model_url":"https_google.com","parameters_count":"70600000000","source_type":"Open-Source","acc":0.7956,"acc_strict":0.1123,"donyaeeqtesad_acc":0.7764350453,"isna_acc":0.76171875,"ninisite_article_acc":0.772972973,"virgool_4_acc":0.8549848943,"khabaronline_acc":0.78,"digiato_acc":0.7954070981,"doctoreto_acc":0.755,"sarzamindownload_acc":0.7385620915,"hamgardi_acc":0.7492625369,"bigbangpage_acc":0.8407643312,"wiki_ahlolbait_acc":0.8421052632,"virgool_3_acc":0.8029850746,"virgool_2_acc":0.8287461774,"virgool_1_acc":0.8259493671,"hamshahrionline_acc":0.862295082,"tabnak_acc":0.8257261411,"alibaba_acc":0.8366013072,"digikala_mag_acc":0.8076152305,"yjc_acc":0.7356321839,"beytoote_acc":0.7922437673,"asriran_acc":0.7874396135,"ecoiran_acc":0.7142857143,"hawzah_acc":0.845505618,"zoomit_acc":0.8403755869,"wikipedia_acc":0.9047619048,"namnak_acc":0.7874659401,"khodro45_acc":0.7941176471,"fidibo_acc":0.8414096916,"newmiind_acc":0.7465277778,"taaghche_acc":0.8076923077,"motamem_acc":0.8947368421,"varzesh3_acc":0.7959866221,"mehrnews_acc":0.7419354839,"tasnim_acc":0.7346153846,"magerta_acc":0.6848739496,"radiokodak_book_acc":0.6086956522,"vipofilm_acc":0.8461538462,"wikishia_acc":0.8787878788,"voolak_acc":0.7906976744,"farsroid_acc":0.6578947368,"parsiday_acc":0.7583333333,"soft98_acc":0.9,"ninisite_discussion_acc":0.5}
         | 
|  | |
| 14 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7712,"acc_strict":0.7712,"donyaeeqtesad_acc":0.7703927492,"isna_acc":0.75390625,"ninisite_article_acc":0.7648648649,"virgool_4_acc":0.8247734139,"khabaronline_acc":0.76,"digiato_acc":0.7745302714,"doctoreto_acc":0.785,"sarzamindownload_acc":0.7581699346,"hamgardi_acc":0.6784660767,"bigbangpage_acc":0.8407643312,"wiki_ahlolbait_acc":0.8223684211,"virgool_3_acc":0.7910447761,"virgool_2_acc":0.7920489297,"virgool_1_acc":0.7943037975,"hamshahrionline_acc":0.8295081967,"tabnak_acc":0.7634854772,"alibaba_acc":0.7973856209,"digikala_mag_acc":0.8056112224,"yjc_acc":0.724137931,"beytoote_acc":0.7783933518,"asriran_acc":0.7777777778,"ecoiran_acc":0.7079365079,"hawzah_acc":0.7724719101,"zoomit_acc":0.8098591549,"wikipedia_acc":0.8761904762,"namnak_acc":0.7547683924,"khodro45_acc":0.7941176471,"fidibo_acc":0.7841409692,"newmiind_acc":0.6875,"taaghche_acc":0.8269230769,"motamem_acc":0.8631578947,"varzesh3_acc":0.7926421405,"mehrnews_acc":0.7056451613,"tasnim_acc":0.7076923077,"magerta_acc":0.6890756303,"radiokodak_book_acc":0.652173913,"vipofilm_acc":0.8461538462,"wikishia_acc":0.8181818182,"voolak_acc":0.6279069767,"farsroid_acc":0.6578947368,"parsiday_acc":0.7083333333,"soft98_acc":0.7,"ninisite_discussion_acc":0.5}
         | 
| 15 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","acc":0.7654,"acc_strict":0.7653,"donyaeeqtesad_acc":0.749244713,"isna_acc":0.75,"ninisite_article_acc":0.7621621622,"virgool_4_acc":0.7824773414,"khabaronline_acc":0.724,"digiato_acc":0.8037578288,"doctoreto_acc":0.8,"sarzamindownload_acc":0.7450980392,"hamgardi_acc":0.6991150442,"bigbangpage_acc":0.8025477707,"wiki_ahlolbait_acc":0.8157894737,"virgool_3_acc":0.8029850746,"virgool_2_acc":0.8073394495,"virgool_1_acc":0.7943037975,"hamshahrionline_acc":0.8,"tabnak_acc":0.7634854772,"alibaba_acc":0.8039215686,"digikala_mag_acc":0.7875751503,"yjc_acc":0.6896551724,"beytoote_acc":0.7783933518,"asriran_acc":0.7632850242,"ecoiran_acc":0.6793650794,"hawzah_acc":0.7724719101,"zoomit_acc":0.8215962441,"wikipedia_acc":0.8523809524,"namnak_acc":0.7520435967,"khodro45_acc":0.8088235294,"fidibo_acc":0.7665198238,"newmiind_acc":0.6909722222,"taaghche_acc":0.7564102564,"motamem_acc":0.8736842105,"varzesh3_acc":0.762541806,"mehrnews_acc":0.689516129,"tasnim_acc":0.7192307692,"magerta_acc":0.7268907563,"radiokodak_book_acc":0.5217391304,"vipofilm_acc":0.7692307692,"wikishia_acc":0.8484848485,"voolak_acc":0.6744186047,"farsroid_acc":0.6578947368,"parsiday_acc":0.675,"soft98_acc":0.7,"ninisite_discussion_acc":0.7}
         | 
|  | |
| 16 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"27400000000","source_type":"Open-Source","acc":0.7628,"acc_strict":0.7628,"donyaeeqtesad_acc":0.6978851964,"isna_acc":0.7265625,"ninisite_article_acc":0.7621621622,"virgool_4_acc":0.8187311178,"khabaronline_acc":0.74,"digiato_acc":0.7661795407,"doctoreto_acc":0.78,"sarzamindownload_acc":0.6993464052,"hamgardi_acc":0.7109144543,"bigbangpage_acc":0.821656051,"wiki_ahlolbait_acc":0.8026315789,"virgool_3_acc":0.7940298507,"virgool_2_acc":0.755351682,"virgool_1_acc":0.7784810127,"hamshahrionline_acc":0.8229508197,"tabnak_acc":0.8174273859,"alibaba_acc":0.7843137255,"digikala_mag_acc":0.7975951904,"yjc_acc":0.7126436782,"beytoote_acc":0.7534626039,"asriran_acc":0.7391304348,"ecoiran_acc":0.7079365079,"hawzah_acc":0.7752808989,"zoomit_acc":0.7957746479,"wikipedia_acc":0.8428571429,"namnak_acc":0.7493188011,"khodro45_acc":0.7867647059,"fidibo_acc":0.8237885463,"newmiind_acc":0.6909722222,"taaghche_acc":0.7820512821,"motamem_acc":0.8315789474,"varzesh3_acc":0.7993311037,"mehrnews_acc":0.6975806452,"tasnim_acc":0.7307692308,"magerta_acc":0.6722689076,"radiokodak_book_acc":0.6956521739,"vipofilm_acc":0.8461538462,"wikishia_acc":0.9393939394,"voolak_acc":0.6976744186,"farsroid_acc":0.6315789474,"parsiday_acc":0.7,"soft98_acc":0.8,"ninisite_discussion_acc":0.7}
         | 
| 17 | 
             
            {"Model Name":"gpt-4o-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7598,"acc_strict":0.7598,"donyaeeqtesad_acc":0.749244713,"isna_acc":0.71484375,"ninisite_article_acc":0.7351351351,"virgool_4_acc":0.8006042296,"khabaronline_acc":0.736,"digiato_acc":0.7599164927,"doctoreto_acc":0.775,"sarzamindownload_acc":0.6535947712,"hamgardi_acc":0.7197640118,"bigbangpage_acc":0.7961783439,"wiki_ahlolbait_acc":0.8289473684,"virgool_3_acc":0.7492537313,"virgool_2_acc":0.7828746177,"virgool_1_acc":0.8006329114,"hamshahrionline_acc":0.8131147541,"tabnak_acc":0.7427385892,"alibaba_acc":0.7810457516,"digikala_mag_acc":0.7615230461,"yjc_acc":0.7643678161,"beytoote_acc":0.7783933518,"asriran_acc":0.7536231884,"ecoiran_acc":0.6952380952,"hawzah_acc":0.7668539326,"zoomit_acc":0.7957746479,"wikipedia_acc":0.8761904762,"namnak_acc":0.7765667575,"khodro45_acc":0.7573529412,"fidibo_acc":0.7621145374,"newmiind_acc":0.6909722222,"taaghche_acc":0.7820512821,"motamem_acc":0.8736842105,"varzesh3_acc":0.8060200669,"mehrnews_acc":0.6733870968,"tasnim_acc":0.75,"magerta_acc":0.6764705882,"radiokodak_book_acc":0.652173913,"vipofilm_acc":0.8461538462,"wikishia_acc":0.8484848485,"voolak_acc":0.7441860465,"farsroid_acc":0.7631578947,"parsiday_acc":0.7083333333,"soft98_acc":0.8,"ninisite_discussion_acc":0.4}
         | 
| 18 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https_google.com","parameters_count":"104000000000","source_type":"Open-Source","acc":0.7364,"acc_strict":0.7364,"donyaeeqtesad_acc":0.752265861,"isna_acc":0.67578125,"ninisite_article_acc":0.7054054054,"virgool_4_acc":0.746223565,"khabaronline_acc":0.724,"digiato_acc":0.7223382046,"doctoreto_acc":0.7,"sarzamindownload_acc":0.6993464052,"hamgardi_acc":0.7020648968,"bigbangpage_acc":0.8089171975,"wiki_ahlolbait_acc":0.8486842105,"virgool_3_acc":0.7194029851,"virgool_2_acc":0.7339449541,"virgool_1_acc":0.7246835443,"hamshahrionline_acc":0.8262295082,"tabnak_acc":0.7178423237,"alibaba_acc":0.7712418301,"digikala_mag_acc":0.7715430862,"yjc_acc":0.7183908046,"beytoote_acc":0.7479224377,"asriran_acc":0.768115942,"ecoiran_acc":0.6698412698,"hawzah_acc":0.7415730337,"zoomit_acc":0.79342723,"wikipedia_acc":0.819047619,"namnak_acc":0.7220708447,"khodro45_acc":0.75,"fidibo_acc":0.7665198238,"newmiind_acc":0.6631944444,"taaghche_acc":0.7820512821,"motamem_acc":0.8631578947,"varzesh3_acc":0.7525083612,"mehrnews_acc":0.6653225806,"tasnim_acc":0.75,"magerta_acc":0.6134453782,"radiokodak_book_acc":0.652173913,"vipofilm_acc":0.9230769231,"wikishia_acc":0.8787878788,"voolak_acc":0.6511627907,"farsroid_acc":0.5,"parsiday_acc":0.7083333333,"soft98_acc":0.9,"ninisite_discussion_acc":0.7}
         | 
|  | |
| 19 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7160432086,"acc_strict":0.7160432086,"donyaeeqtesad_acc":0.6888217523,"isna_acc":0.69140625,"ninisite_article_acc":0.7,"virgool_4_acc":0.7311178248,"khabaronline_acc":0.712,"digiato_acc":0.7181628392,"doctoreto_acc":0.745,"sarzamindownload_acc":0.6013071895,"hamgardi_acc":0.6755162242,"bigbangpage_acc":0.7770700637,"wiki_ahlolbait_acc":0.8684210526,"virgool_3_acc":0.7194029851,"virgool_2_acc":0.7064220183,"virgool_1_acc":0.7056962025,"hamshahrionline_acc":0.7803278689,"tabnak_acc":0.6887966805,"alibaba_acc":0.7483660131,"digikala_mag_acc":0.7434869739,"yjc_acc":0.6724137931,"beytoote_acc":0.728531856,"asriran_acc":0.7487922705,"ecoiran_acc":0.6761904762,"hawzah_acc":0.7584269663,"zoomit_acc":0.7558685446,"wikipedia_acc":0.780952381,"namnak_acc":0.7002724796,"khodro45_acc":0.7279411765,"fidibo_acc":0.7665198238,"newmiind_acc":0.6202090592,"taaghche_acc":0.7628205128,"motamem_acc":0.8404255319,"varzesh3_acc":0.7324414716,"mehrnews_acc":0.6169354839,"tasnim_acc":0.6923076923,"magerta_acc":0.6680672269,"radiokodak_book_acc":0.5652173913,"vipofilm_acc":0.9230769231,"wikishia_acc":0.7878787879,"voolak_acc":0.6511627907,"farsroid_acc":0.7105263158,"parsiday_acc":0.575,"soft98_acc":0.9,"ninisite_discussion_acc":0.3}
         | 
| 20 | 
             
            {"Model Name":"gemma-3-12b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"12200000000","source_type":"Open-Source","acc":0.7094,"acc_strict":0.7094,"donyaeeqtesad_acc":0.6586102719,"isna_acc":0.65625,"ninisite_article_acc":0.7243243243,"virgool_4_acc":0.7643504532,"khabaronline_acc":0.704,"digiato_acc":0.7369519833,"doctoreto_acc":0.76,"sarzamindownload_acc":0.6797385621,"hamgardi_acc":0.6666666667,"bigbangpage_acc":0.7515923567,"wiki_ahlolbait_acc":0.7631578947,"virgool_3_acc":0.7223880597,"virgool_2_acc":0.7584097859,"virgool_1_acc":0.7183544304,"hamshahrionline_acc":0.7213114754,"tabnak_acc":0.7219917012,"alibaba_acc":0.6830065359,"digikala_mag_acc":0.7354709419,"yjc_acc":0.6206896552,"beytoote_acc":0.7146814404,"asriran_acc":0.7198067633,"ecoiran_acc":0.6603174603,"hawzah_acc":0.702247191,"zoomit_acc":0.7323943662,"wikipedia_acc":0.7714285714,"namnak_acc":0.7329700272,"khodro45_acc":0.7352941176,"fidibo_acc":0.718061674,"newmiind_acc":0.6493055556,"taaghche_acc":0.7564102564,"motamem_acc":0.8210526316,"varzesh3_acc":0.7157190635,"mehrnews_acc":0.6088709677,"tasnim_acc":0.6576923077,"magerta_acc":0.6302521008,"radiokodak_book_acc":0.652173913,"vipofilm_acc":0.7692307692,"wikishia_acc":0.8787878788,"voolak_acc":0.6976744186,"farsroid_acc":0.7368421053,"parsiday_acc":0.6583333333,"soft98_acc":0.8,"ninisite_discussion_acc":0.8}
         | 
|  | |
| 21 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https_google.com","parameters_count":"14800000000","source_type":"Open-Source","acc":0.6958,"acc_strict":0.6958,"donyaeeqtesad_acc":0.6495468278,"isna_acc":0.62890625,"ninisite_article_acc":0.6972972973,"virgool_4_acc":0.7069486405,"khabaronline_acc":0.652,"digiato_acc":0.7202505219,"doctoreto_acc":0.77,"sarzamindownload_acc":0.614379085,"hamgardi_acc":0.6430678466,"bigbangpage_acc":0.7579617834,"wiki_ahlolbait_acc":0.7631578947,"virgool_3_acc":0.7373134328,"virgool_2_acc":0.7155963303,"virgool_1_acc":0.7278481013,"hamshahrionline_acc":0.7278688525,"tabnak_acc":0.6970954357,"alibaba_acc":0.7254901961,"digikala_mag_acc":0.7074148297,"yjc_acc":0.6379310345,"beytoote_acc":0.6842105263,"asriran_acc":0.6859903382,"ecoiran_acc":0.653968254,"hawzah_acc":0.7078651685,"zoomit_acc":0.7676056338,"wikipedia_acc":0.8142857143,"namnak_acc":0.6621253406,"khodro45_acc":0.7647058824,"fidibo_acc":0.731277533,"newmiind_acc":0.6597222222,"taaghche_acc":0.6987179487,"motamem_acc":0.8105263158,"varzesh3_acc":0.6220735786,"mehrnews_acc":0.625,"tasnim_acc":0.6692307692,"magerta_acc":0.6596638655,"radiokodak_book_acc":0.5652173913,"vipofilm_acc":0.9230769231,"wikishia_acc":0.8787878788,"voolak_acc":0.6279069767,"farsroid_acc":0.6052631579,"parsiday_acc":0.5666666667,"soft98_acc":0.9,"ninisite_discussion_acc":0.7}
         | 
| 22 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https_google.com","parameters_count":"24000000000","source_type":"Open-Source","acc":0.6894,"acc_strict":0.6894,"donyaeeqtesad_acc":0.670694864,"isna_acc":0.63671875,"ninisite_article_acc":0.6945945946,"virgool_4_acc":0.7039274924,"khabaronline_acc":0.664,"digiato_acc":0.6826722338,"doctoreto_acc":0.755,"sarzamindownload_acc":0.6339869281,"hamgardi_acc":0.6342182891,"bigbangpage_acc":0.7452229299,"wiki_ahlolbait_acc":0.7697368421,"virgool_3_acc":0.7014925373,"virgool_2_acc":0.7125382263,"virgool_1_acc":0.7341772152,"hamshahrionline_acc":0.7278688525,"tabnak_acc":0.6307053942,"alibaba_acc":0.7647058824,"digikala_mag_acc":0.7174348697,"yjc_acc":0.5804597701,"beytoote_acc":0.6814404432,"asriran_acc":0.6811594203,"ecoiran_acc":0.6158730159,"hawzah_acc":0.6994382022,"zoomit_acc":0.7441314554,"wikipedia_acc":0.8333333333,"namnak_acc":0.659400545,"khodro45_acc":0.7058823529,"fidibo_acc":0.7268722467,"newmiind_acc":0.6527777778,"taaghche_acc":0.7051282051,"motamem_acc":0.8526315789,"varzesh3_acc":0.6789297659,"mehrnews_acc":0.5887096774,"tasnim_acc":0.6692307692,"magerta_acc":0.6680672269,"radiokodak_book_acc":0.4347826087,"vipofilm_acc":0.6923076923,"wikishia_acc":0.7575757576,"voolak_acc":0.6511627907,"farsroid_acc":0.6842105263,"parsiday_acc":0.55,"soft98_acc":0.8,"ninisite_discussion_acc":0.4}
         | 
| 23 | 
             
            {"Model Name":"Qwen3-30B-A3B","thinking_method":"β","model_url":"https_google.com","parameters_count":"30500000000","source_type":"Open-Source","acc":0.688,"acc_strict":0.688,"donyaeeqtesad_acc":0.6465256798,"isna_acc":0.6640625,"ninisite_article_acc":0.7243243243,"virgool_4_acc":0.7311178248,"khabaronline_acc":0.668,"digiato_acc":0.6764091858,"doctoreto_acc":0.765,"sarzamindownload_acc":0.7058823529,"hamgardi_acc":0.6519174041,"bigbangpage_acc":0.8025477707,"wiki_ahlolbait_acc":0.7368421053,"virgool_3_acc":0.7134328358,"virgool_2_acc":0.7003058104,"virgool_1_acc":0.7025316456,"hamshahrionline_acc":0.6819672131,"tabnak_acc":0.7012448133,"alibaba_acc":0.7189542484,"digikala_mag_acc":0.6753507014,"yjc_acc":0.632183908,"beytoote_acc":0.6703601108,"asriran_acc":0.652173913,"ecoiran_acc":0.6126984127,"hawzah_acc":0.7387640449,"zoomit_acc":0.7300469484,"wikipedia_acc":0.7904761905,"namnak_acc":0.6920980926,"khodro45_acc":0.7279411765,"fidibo_acc":0.6872246696,"newmiind_acc":0.6631944444,"taaghche_acc":0.6858974359,"motamem_acc":0.8,"varzesh3_acc":0.6120401338,"mehrnews_acc":0.6129032258,"tasnim_acc":0.65,"magerta_acc":0.6596638655,"radiokodak_book_acc":0.4782608696,"vipofilm_acc":0.7692307692,"wikishia_acc":0.8787878788,"voolak_acc":0.6511627907,"farsroid_acc":0.6578947368,"parsiday_acc":0.6,"soft98_acc":0.8,"ninisite_discussion_acc":0.4}
         | 
|  | |
| 4 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8839,"acc_strict":0.8839,"donyaeeqtesad_acc":0.8610271903,"isna_acc":0.8359375,"ninisite_article_acc":0.8702702703,"virgool_4_acc":0.9033232628,"khabaronline_acc":0.884,"digiato_acc":0.8705636743,"doctoreto_acc":0.885,"sarzamindownload_acc":0.8562091503,"hamgardi_acc":0.8377581121,"bigbangpage_acc":0.923566879,"wiki_ahlolbait_acc":0.9276315789,"virgool_3_acc":0.9104477612,"virgool_2_acc":0.8837920489,"virgool_1_acc":0.8607594937,"hamshahrionline_acc":0.9114754098,"tabnak_acc":0.887966805,"alibaba_acc":0.9117647059,"digikala_mag_acc":0.9118236473,"yjc_acc":0.867816092,"beytoote_acc":0.91966759,"asriran_acc":0.8792270531,"ecoiran_acc":0.8634920635,"hawzah_acc":0.9269662921,"zoomit_acc":0.9154929577,"wikipedia_acc":0.9428571429,"namnak_acc":0.8583106267,"khodro45_acc":0.8602941176,"fidibo_acc":0.9074889868,"newmiind_acc":0.8020833333,"taaghche_acc":0.8974358974,"motamem_acc":0.9263157895,"varzesh3_acc":0.9096989967,"mehrnews_acc":0.8508064516,"tasnim_acc":0.8307692308,"magerta_acc":0.8403361345,"radiokodak_book_acc":0.8695652174,"vipofilm_acc":1.0,"wikishia_acc":1.0,"voolak_acc":0.8837209302,"farsroid_acc":0.8421052632,"parsiday_acc":0.8833333333,"soft98_acc":0.9,"ninisite_discussion_acc":0.9}
         | 
| 5 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8717,"acc_strict":0.8714,"donyaeeqtesad_acc":0.8700906344,"isna_acc":0.8671875,"ninisite_article_acc":0.8621621622,"virgool_4_acc":0.9033232628,"khabaronline_acc":0.852,"digiato_acc":0.8747390397,"doctoreto_acc":0.9,"sarzamindownload_acc":0.8562091503,"hamgardi_acc":0.8230088496,"bigbangpage_acc":0.898089172,"wiki_ahlolbait_acc":0.8881578947,"virgool_3_acc":0.9104477612,"virgool_2_acc":0.8929663609,"virgool_1_acc":0.8765822785,"hamshahrionline_acc":0.8786885246,"tabnak_acc":0.8755186722,"alibaba_acc":0.9183006536,"digikala_mag_acc":0.8977955912,"yjc_acc":0.8563218391,"beytoote_acc":0.8864265928,"asriran_acc":0.8212560386,"ecoiran_acc":0.8476190476,"hawzah_acc":0.8960674157,"zoomit_acc":0.9084507042,"wikipedia_acc":0.9238095238,"namnak_acc":0.8310626703,"khodro45_acc":0.8382352941,"fidibo_acc":0.9207048458,"newmiind_acc":0.8194444444,"taaghche_acc":0.9038461538,"motamem_acc":0.9368421053,"varzesh3_acc":0.8829431438,"mehrnews_acc":0.8064516129,"tasnim_acc":0.8692307692,"magerta_acc":0.7605042017,"radiokodak_book_acc":0.8260869565,"vipofilm_acc":0.9230769231,"wikishia_acc":0.9393939394,"voolak_acc":0.8372093023,"farsroid_acc":0.7894736842,"parsiday_acc":0.775,"soft98_acc":0.9,"ninisite_discussion_acc":0.8}
         | 
| 6 | 
             
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8665,"acc_strict":0.7832,"donyaeeqtesad_acc":0.8459214502,"isna_acc":0.8359375,"ninisite_article_acc":0.8594594595,"virgool_4_acc":0.8882175227,"khabaronline_acc":0.896,"digiato_acc":0.8496868476,"doctoreto_acc":0.855,"sarzamindownload_acc":0.8235294118,"hamgardi_acc":0.8200589971,"bigbangpage_acc":0.9171974522,"wiki_ahlolbait_acc":0.9342105263,"virgool_3_acc":0.8656716418,"virgool_2_acc":0.8837920489,"virgool_1_acc":0.8892405063,"hamshahrionline_acc":0.9409836066,"tabnak_acc":0.887966805,"alibaba_acc":0.8529411765,"digikala_mag_acc":0.8817635271,"yjc_acc":0.8103448276,"beytoote_acc":0.8891966759,"asriran_acc":0.8550724638,"ecoiran_acc":0.8126984127,"hawzah_acc":0.9129213483,"zoomit_acc":0.9084507042,"wikipedia_acc":0.9285714286,"namnak_acc":0.8446866485,"khodro45_acc":0.8455882353,"fidibo_acc":0.872246696,"newmiind_acc":0.8125,"taaghche_acc":0.9038461538,"motamem_acc":0.9157894737,"varzesh3_acc":0.8996655518,"mehrnews_acc":0.814516129,"tasnim_acc":0.8461538462,"magerta_acc":0.781512605,"radiokodak_book_acc":0.7826086957,"vipofilm_acc":0.9230769231,"wikishia_acc":0.9696969697,"voolak_acc":0.7674418605,"farsroid_acc":0.7105263158,"parsiday_acc":0.85,"soft98_acc":0.8,"ninisite_discussion_acc":0.9}
         | 
| 7 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8651,"acc_strict":0.8651,"donyaeeqtesad_acc":0.8429003021,"isna_acc":0.80859375,"ninisite_article_acc":0.8756756757,"virgool_4_acc":0.8912386707,"khabaronline_acc":0.864,"digiato_acc":0.8956158664,"doctoreto_acc":0.91,"sarzamindownload_acc":0.8366013072,"hamgardi_acc":0.8200589971,"bigbangpage_acc":0.9044585987,"wiki_ahlolbait_acc":0.8947368421,"virgool_3_acc":0.8626865672,"virgool_2_acc":0.8868501529,"virgool_1_acc":0.8924050633,"hamshahrionline_acc":0.8786885246,"tabnak_acc":0.8838174274,"alibaba_acc":0.8464052288,"digikala_mag_acc":0.8917835671,"yjc_acc":0.8218390805,"beytoote_acc":0.8836565097,"asriran_acc":0.8357487923,"ecoiran_acc":0.8380952381,"hawzah_acc":0.8623595506,"zoomit_acc":0.896713615,"wikipedia_acc":0.9142857143,"namnak_acc":0.8610354223,"khodro45_acc":0.875,"fidibo_acc":0.8546255507,"newmiind_acc":0.8020833333,"taaghche_acc":0.9166666667,"motamem_acc":0.9052631579,"varzesh3_acc":0.8963210702,"mehrnews_acc":0.8387096774,"tasnim_acc":0.8423076923,"magerta_acc":0.781512605,"radiokodak_book_acc":0.7391304348,"vipofilm_acc":1.0,"wikishia_acc":0.9090909091,"voolak_acc":0.7906976744,"farsroid_acc":0.8421052632,"parsiday_acc":0.825,"soft98_acc":0.9,"ninisite_discussion_acc":0.5}
         | 
| 8 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8637863786,"acc_strict":0.8637863786,"donyaeeqtesad_acc":0.8398791541,"isna_acc":0.828125,"ninisite_article_acc":0.8243243243,"virgool_4_acc":0.8851963746,"khabaronline_acc":0.84,"digiato_acc":0.8747390397,"doctoreto_acc":0.895,"sarzamindownload_acc":0.8366013072,"hamgardi_acc":0.802359882,"bigbangpage_acc":0.898089172,"wiki_ahlolbait_acc":0.9407894737,"virgool_3_acc":0.8955223881,"virgool_2_acc":0.8899082569,"virgool_1_acc":0.8892405063,"hamshahrionline_acc":0.8754098361,"tabnak_acc":0.8755186722,"alibaba_acc":0.8426229508,"digikala_mag_acc":0.877755511,"yjc_acc":0.816091954,"beytoote_acc":0.8836565097,"asriran_acc":0.8888888889,"ecoiran_acc":0.8126984127,"hawzah_acc":0.8904494382,"zoomit_acc":0.9084507042,"wikipedia_acc":0.919047619,"namnak_acc":0.8392370572,"khodro45_acc":0.8823529412,"fidibo_acc":0.9030837004,"newmiind_acc":0.8125,"taaghche_acc":0.9423076923,"motamem_acc":0.9157894737,"varzesh3_acc":0.8929765886,"mehrnews_acc":0.8427419355,"tasnim_acc":0.8153846154,"magerta_acc":0.7773109244,"radiokodak_book_acc":0.6956521739,"vipofilm_acc":1.0,"wikishia_acc":0.9696969697,"voolak_acc":0.7441860465,"farsroid_acc":0.7894736842,"parsiday_acc":0.8166666667,"soft98_acc":1.0,"ninisite_discussion_acc":0.9}
         | 
| 9 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8551,"acc_strict":0.8551,"donyaeeqtesad_acc":0.8429003021,"isna_acc":0.828125,"ninisite_article_acc":0.8540540541,"virgool_4_acc":0.8610271903,"khabaronline_acc":0.84,"digiato_acc":0.8830897704,"doctoreto_acc":0.87,"sarzamindownload_acc":0.8758169935,"hamgardi_acc":0.796460177,"bigbangpage_acc":0.8853503185,"wiki_ahlolbait_acc":0.9013157895,"virgool_3_acc":0.871641791,"virgool_2_acc":0.9051987768,"virgool_1_acc":0.8481012658,"hamshahrionline_acc":0.8786885246,"tabnak_acc":0.8713692946,"alibaba_acc":0.8758169935,"digikala_mag_acc":0.879759519,"yjc_acc":0.7988505747,"beytoote_acc":0.8753462604,"asriran_acc":0.8260869565,"ecoiran_acc":0.8031746032,"hawzah_acc":0.8511235955,"zoomit_acc":0.8849765258,"wikipedia_acc":0.9285714286,"namnak_acc":0.8310626703,"khodro45_acc":0.8897058824,"fidibo_acc":0.872246696,"newmiind_acc":0.7881944444,"taaghche_acc":0.8974358974,"motamem_acc":0.9157894737,"varzesh3_acc":0.8762541806,"mehrnews_acc":0.8346774194,"tasnim_acc":0.8269230769,"magerta_acc":0.7941176471,"radiokodak_book_acc":0.6956521739,"vipofilm_acc":0.7692307692,"wikishia_acc":0.9393939394,"voolak_acc":0.8372093023,"farsroid_acc":0.8157894737,"parsiday_acc":0.7583333333,"soft98_acc":0.8,"ninisite_discussion_acc":0.3}
         | 
| 10 | 
             
            {"Model Name":"deepseek-reasoner","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"671000000000","source_type":"Open-Source","acc":0.825165033,"acc_strict":0.825165033,"donyaeeqtesad_acc":0.8247734139,"isna_acc":0.8046875,"ninisite_article_acc":0.8594594595,"virgool_4_acc":0.8580060423,"khabaronline_acc":0.78,"digiato_acc":0.8267223382,"doctoreto_acc":0.835,"sarzamindownload_acc":0.7908496732,"hamgardi_acc":0.808259587,"bigbangpage_acc":0.9044585987,"wiki_ahlolbait_acc":0.9006622517,"virgool_3_acc":0.8268656716,"virgool_2_acc":0.8348623853,"virgool_1_acc":0.7911392405,"hamshahrionline_acc":0.8651315789,"tabnak_acc":0.8215767635,"alibaba_acc":0.8169934641,"digikala_mag_acc":0.8336673347,"yjc_acc":0.7873563218,"beytoote_acc":0.8310249307,"asriran_acc":0.8212560386,"ecoiran_acc":0.7523809524,"hawzah_acc":0.8735955056,"zoomit_acc":0.8450704225,"wikipedia_acc":0.9,"namnak_acc":0.8337874659,"khodro45_acc":0.8088235294,"fidibo_acc":0.845814978,"newmiind_acc":0.7604166667,"taaghche_acc":0.891025641,"motamem_acc":0.8947368421,"varzesh3_acc":0.8093645485,"mehrnews_acc":0.7782258065,"tasnim_acc":0.8115384615,"magerta_acc":0.7647058824,"radiokodak_book_acc":0.6086956522,"vipofilm_acc":0.9230769231,"wikishia_acc":0.9393939394,"voolak_acc":0.8372093023,"farsroid_acc":0.7368421053,"parsiday_acc":0.7583333333,"soft98_acc":0.9,"ninisite_discussion_acc":0.7}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.8143,"acc_strict":0.8143,"donyaeeqtesad_acc":0.7975830816,"isna_acc":0.77734375,"ninisite_article_acc":0.8,"virgool_4_acc":0.833836858,"khabaronline_acc":0.796,"digiato_acc":0.8037578288,"doctoreto_acc":0.82,"sarzamindownload_acc":0.7712418301,"hamgardi_acc":0.7669616519,"bigbangpage_acc":0.8598726115,"wiki_ahlolbait_acc":0.8947368421,"virgool_3_acc":0.8298507463,"virgool_2_acc":0.8409785933,"virgool_1_acc":0.8196202532,"hamshahrionline_acc":0.8557377049,"tabnak_acc":0.8215767635,"alibaba_acc":0.8202614379,"digikala_mag_acc":0.8176352705,"yjc_acc":0.8045977011,"beytoote_acc":0.811634349,"asriran_acc":0.7874396135,"ecoiran_acc":0.7682539683,"hawzah_acc":0.8511235955,"zoomit_acc":0.8474178404,"wikipedia_acc":0.8952380952,"namnak_acc":0.7847411444,"khodro45_acc":0.8382352941,"fidibo_acc":0.845814978,"newmiind_acc":0.7708333333,"taaghche_acc":0.8525641026,"motamem_acc":0.9157894737,"varzesh3_acc":0.8394648829,"mehrnews_acc":0.7459677419,"tasnim_acc":0.8230769231,"magerta_acc":0.7478991597,"radiokodak_book_acc":0.6956521739,"vipofilm_acc":1.0,"wikishia_acc":1.0,"voolak_acc":0.7906976744,"farsroid_acc":0.7105263158,"parsiday_acc":0.7416666667,"soft98_acc":0.9,"ninisite_discussion_acc":0.6}
         | 
| 13 | 
             
            {"Model Name":"c4ai-command-a-03-2025","thinking_method":"β","model_url":"https_google.com","parameters_count":"111000000000","source_type":"Open-Source","acc":0.798859772,"acc_strict":0.7983596719,"donyaeeqtesad_acc":0.7673716012,"isna_acc":0.76953125,"ninisite_article_acc":0.7696476965,"virgool_4_acc":0.8398791541,"khabaronline_acc":0.78,"digiato_acc":0.7870563674,"doctoreto_acc":0.82,"sarzamindownload_acc":0.7712418301,"hamgardi_acc":0.7610619469,"bigbangpage_acc":0.8789808917,"wiki_ahlolbait_acc":0.8486842105,"virgool_3_acc":0.8119402985,"virgool_2_acc":0.8226299694,"virgool_1_acc":0.8037974684,"hamshahrionline_acc":0.8557377049,"tabnak_acc":0.8298755187,"alibaba_acc":0.8562091503,"digikala_mag_acc":0.8152610442,"yjc_acc":0.7471264368,"beytoote_acc":0.8005540166,"asriran_acc":0.7922705314,"ecoiran_acc":0.7333333333,"hawzah_acc":0.8342696629,"zoomit_acc":0.8427230047,"wikipedia_acc":0.9095238095,"namnak_acc":0.7738419619,"khodro45_acc":0.8088235294,"fidibo_acc":0.845814978,"newmiind_acc":0.7222222222,"taaghche_acc":0.8397435897,"motamem_acc":0.8947368421,"varzesh3_acc":0.7993311037,"mehrnews_acc":0.7338709677,"tasnim_acc":0.7730769231,"magerta_acc":0.6974789916,"radiokodak_book_acc":0.652173913,"vipofilm_acc":0.9230769231,"wikishia_acc":0.8484848485,"voolak_acc":0.7441860465,"farsroid_acc":0.6578947368,"parsiday_acc":0.7166666667,"soft98_acc":0.8,"ninisite_discussion_acc":0.6}
         | 
| 14 | 
             
            {"Model Name":"Llama-3.3-70B-Instruct","thinking_method":"β","model_url":"https_google.com","parameters_count":"70600000000","source_type":"Open-Source","acc":0.7956,"acc_strict":0.1123,"donyaeeqtesad_acc":0.7764350453,"isna_acc":0.76171875,"ninisite_article_acc":0.772972973,"virgool_4_acc":0.8549848943,"khabaronline_acc":0.78,"digiato_acc":0.7954070981,"doctoreto_acc":0.755,"sarzamindownload_acc":0.7385620915,"hamgardi_acc":0.7492625369,"bigbangpage_acc":0.8407643312,"wiki_ahlolbait_acc":0.8421052632,"virgool_3_acc":0.8029850746,"virgool_2_acc":0.8287461774,"virgool_1_acc":0.8259493671,"hamshahrionline_acc":0.862295082,"tabnak_acc":0.8257261411,"alibaba_acc":0.8366013072,"digikala_mag_acc":0.8076152305,"yjc_acc":0.7356321839,"beytoote_acc":0.7922437673,"asriran_acc":0.7874396135,"ecoiran_acc":0.7142857143,"hawzah_acc":0.845505618,"zoomit_acc":0.8403755869,"wikipedia_acc":0.9047619048,"namnak_acc":0.7874659401,"khodro45_acc":0.7941176471,"fidibo_acc":0.8414096916,"newmiind_acc":0.7465277778,"taaghche_acc":0.8076923077,"motamem_acc":0.8947368421,"varzesh3_acc":0.7959866221,"mehrnews_acc":0.7419354839,"tasnim_acc":0.7346153846,"magerta_acc":0.6848739496,"radiokodak_book_acc":0.6086956522,"vipofilm_acc":0.8461538462,"wikishia_acc":0.8787878788,"voolak_acc":0.7906976744,"farsroid_acc":0.6578947368,"parsiday_acc":0.7583333333,"soft98_acc":0.9,"ninisite_discussion_acc":0.5}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https_google.com","parameters_count":"109000000000","source_type":"Open-Source","acc":0.7814,"acc_strict":0.1472,"donyaeeqtesad_acc":0.7945619335,"isna_acc":0.7421875,"ninisite_article_acc":0.7486486486,"virgool_4_acc":0.8157099698,"khabaronline_acc":0.756,"digiato_acc":0.7933194154,"doctoreto_acc":0.8,"sarzamindownload_acc":0.7189542484,"hamgardi_acc":0.7197640118,"bigbangpage_acc":0.8407643312,"wiki_ahlolbait_acc":0.8421052632,"virgool_3_acc":0.7850746269,"virgool_2_acc":0.8073394495,"virgool_1_acc":0.7784810127,"hamshahrionline_acc":0.8557377049,"tabnak_acc":0.8132780083,"alibaba_acc":0.8006535948,"digikala_mag_acc":0.7715430862,"yjc_acc":0.7471264368,"beytoote_acc":0.7700831025,"asriran_acc":0.7777777778,"ecoiran_acc":0.7523809524,"hawzah_acc":0.7949438202,"zoomit_acc":0.8192488263,"wikipedia_acc":0.8428571429,"namnak_acc":0.7820163488,"khodro45_acc":0.8088235294,"fidibo_acc":0.7929515419,"newmiind_acc":0.6979166667,"taaghche_acc":0.8269230769,"motamem_acc":0.8842105263,"varzesh3_acc":0.8160535117,"mehrnews_acc":0.7258064516,"tasnim_acc":0.7769230769,"magerta_acc":0.7100840336,"radiokodak_book_acc":0.6086956522,"vipofilm_acc":0.7692307692,"wikishia_acc":0.8484848485,"voolak_acc":0.7441860465,"farsroid_acc":0.7631578947,"parsiday_acc":0.6916666667,"soft98_acc":0.8,"ninisite_discussion_acc":0.6}
         | 
| 16 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7712,"acc_strict":0.7712,"donyaeeqtesad_acc":0.7703927492,"isna_acc":0.75390625,"ninisite_article_acc":0.7648648649,"virgool_4_acc":0.8247734139,"khabaronline_acc":0.76,"digiato_acc":0.7745302714,"doctoreto_acc":0.785,"sarzamindownload_acc":0.7581699346,"hamgardi_acc":0.6784660767,"bigbangpage_acc":0.8407643312,"wiki_ahlolbait_acc":0.8223684211,"virgool_3_acc":0.7910447761,"virgool_2_acc":0.7920489297,"virgool_1_acc":0.7943037975,"hamshahrionline_acc":0.8295081967,"tabnak_acc":0.7634854772,"alibaba_acc":0.7973856209,"digikala_mag_acc":0.8056112224,"yjc_acc":0.724137931,"beytoote_acc":0.7783933518,"asriran_acc":0.7777777778,"ecoiran_acc":0.7079365079,"hawzah_acc":0.7724719101,"zoomit_acc":0.8098591549,"wikipedia_acc":0.8761904762,"namnak_acc":0.7547683924,"khodro45_acc":0.7941176471,"fidibo_acc":0.7841409692,"newmiind_acc":0.6875,"taaghche_acc":0.8269230769,"motamem_acc":0.8631578947,"varzesh3_acc":0.7926421405,"mehrnews_acc":0.7056451613,"tasnim_acc":0.7076923077,"magerta_acc":0.6890756303,"radiokodak_book_acc":0.652173913,"vipofilm_acc":0.8461538462,"wikishia_acc":0.8181818182,"voolak_acc":0.6279069767,"farsroid_acc":0.6578947368,"parsiday_acc":0.7083333333,"soft98_acc":0.7,"ninisite_discussion_acc":0.5}
         | 
| 17 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","acc":0.7654,"acc_strict":0.7653,"donyaeeqtesad_acc":0.749244713,"isna_acc":0.75,"ninisite_article_acc":0.7621621622,"virgool_4_acc":0.7824773414,"khabaronline_acc":0.724,"digiato_acc":0.8037578288,"doctoreto_acc":0.8,"sarzamindownload_acc":0.7450980392,"hamgardi_acc":0.6991150442,"bigbangpage_acc":0.8025477707,"wiki_ahlolbait_acc":0.8157894737,"virgool_3_acc":0.8029850746,"virgool_2_acc":0.8073394495,"virgool_1_acc":0.7943037975,"hamshahrionline_acc":0.8,"tabnak_acc":0.7634854772,"alibaba_acc":0.8039215686,"digikala_mag_acc":0.7875751503,"yjc_acc":0.6896551724,"beytoote_acc":0.7783933518,"asriran_acc":0.7632850242,"ecoiran_acc":0.6793650794,"hawzah_acc":0.7724719101,"zoomit_acc":0.8215962441,"wikipedia_acc":0.8523809524,"namnak_acc":0.7520435967,"khodro45_acc":0.8088235294,"fidibo_acc":0.7665198238,"newmiind_acc":0.6909722222,"taaghche_acc":0.7564102564,"motamem_acc":0.8736842105,"varzesh3_acc":0.762541806,"mehrnews_acc":0.689516129,"tasnim_acc":0.7192307692,"magerta_acc":0.7268907563,"radiokodak_book_acc":0.5217391304,"vipofilm_acc":0.7692307692,"wikishia_acc":0.8484848485,"voolak_acc":0.6744186047,"farsroid_acc":0.6578947368,"parsiday_acc":0.675,"soft98_acc":0.7,"ninisite_discussion_acc":0.7}
         | 
| 18 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","acc":0.7643,"acc_strict":0.7643,"donyaeeqtesad_acc":0.7039274924,"isna_acc":0.73828125,"ninisite_article_acc":0.7567567568,"virgool_4_acc":0.8096676737,"khabaronline_acc":0.688,"digiato_acc":0.7703549061,"doctoreto_acc":0.84,"sarzamindownload_acc":0.7712418301,"hamgardi_acc":0.7256637168,"bigbangpage_acc":0.7898089172,"wiki_ahlolbait_acc":0.7697368421,"virgool_3_acc":0.8149253731,"virgool_2_acc":0.8195718654,"virgool_1_acc":0.7879746835,"hamshahrionline_acc":0.7573770492,"tabnak_acc":0.7136929461,"alibaba_acc":0.7712418301,"digikala_mag_acc":0.8016032064,"yjc_acc":0.7011494253,"beytoote_acc":0.7950138504,"asriran_acc":0.7246376812,"ecoiran_acc":0.7079365079,"hawzah_acc":0.7556179775,"zoomit_acc":0.7957746479,"wikipedia_acc":0.9,"namnak_acc":0.7547683924,"khodro45_acc":0.8014705882,"fidibo_acc":0.7885462555,"newmiind_acc":0.7465277778,"taaghche_acc":0.7820512821,"motamem_acc":0.8631578947,"varzesh3_acc":0.7257525084,"mehrnews_acc":0.6814516129,"tasnim_acc":0.7269230769,"magerta_acc":0.7731092437,"radiokodak_book_acc":0.5652173913,"vipofilm_acc":0.9230769231,"wikishia_acc":0.8787878788,"voolak_acc":0.7674418605,"farsroid_acc":0.6842105263,"parsiday_acc":0.6916666667,"soft98_acc":0.9,"ninisite_discussion_acc":0.3}
         | 
| 19 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"27400000000","source_type":"Open-Source","acc":0.7628,"acc_strict":0.7628,"donyaeeqtesad_acc":0.6978851964,"isna_acc":0.7265625,"ninisite_article_acc":0.7621621622,"virgool_4_acc":0.8187311178,"khabaronline_acc":0.74,"digiato_acc":0.7661795407,"doctoreto_acc":0.78,"sarzamindownload_acc":0.6993464052,"hamgardi_acc":0.7109144543,"bigbangpage_acc":0.821656051,"wiki_ahlolbait_acc":0.8026315789,"virgool_3_acc":0.7940298507,"virgool_2_acc":0.755351682,"virgool_1_acc":0.7784810127,"hamshahrionline_acc":0.8229508197,"tabnak_acc":0.8174273859,"alibaba_acc":0.7843137255,"digikala_mag_acc":0.7975951904,"yjc_acc":0.7126436782,"beytoote_acc":0.7534626039,"asriran_acc":0.7391304348,"ecoiran_acc":0.7079365079,"hawzah_acc":0.7752808989,"zoomit_acc":0.7957746479,"wikipedia_acc":0.8428571429,"namnak_acc":0.7493188011,"khodro45_acc":0.7867647059,"fidibo_acc":0.8237885463,"newmiind_acc":0.6909722222,"taaghche_acc":0.7820512821,"motamem_acc":0.8315789474,"varzesh3_acc":0.7993311037,"mehrnews_acc":0.6975806452,"tasnim_acc":0.7307692308,"magerta_acc":0.6722689076,"radiokodak_book_acc":0.6956521739,"vipofilm_acc":0.8461538462,"wikishia_acc":0.9393939394,"voolak_acc":0.6976744186,"farsroid_acc":0.6315789474,"parsiday_acc":0.7,"soft98_acc":0.8,"ninisite_discussion_acc":0.7}
         | 
| 20 | 
             
            {"Model Name":"gpt-4o-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7598,"acc_strict":0.7598,"donyaeeqtesad_acc":0.749244713,"isna_acc":0.71484375,"ninisite_article_acc":0.7351351351,"virgool_4_acc":0.8006042296,"khabaronline_acc":0.736,"digiato_acc":0.7599164927,"doctoreto_acc":0.775,"sarzamindownload_acc":0.6535947712,"hamgardi_acc":0.7197640118,"bigbangpage_acc":0.7961783439,"wiki_ahlolbait_acc":0.8289473684,"virgool_3_acc":0.7492537313,"virgool_2_acc":0.7828746177,"virgool_1_acc":0.8006329114,"hamshahrionline_acc":0.8131147541,"tabnak_acc":0.7427385892,"alibaba_acc":0.7810457516,"digikala_mag_acc":0.7615230461,"yjc_acc":0.7643678161,"beytoote_acc":0.7783933518,"asriran_acc":0.7536231884,"ecoiran_acc":0.6952380952,"hawzah_acc":0.7668539326,"zoomit_acc":0.7957746479,"wikipedia_acc":0.8761904762,"namnak_acc":0.7765667575,"khodro45_acc":0.7573529412,"fidibo_acc":0.7621145374,"newmiind_acc":0.6909722222,"taaghche_acc":0.7820512821,"motamem_acc":0.8736842105,"varzesh3_acc":0.8060200669,"mehrnews_acc":0.6733870968,"tasnim_acc":0.75,"magerta_acc":0.6764705882,"radiokodak_book_acc":0.652173913,"vipofilm_acc":0.8461538462,"wikishia_acc":0.8484848485,"voolak_acc":0.7441860465,"farsroid_acc":0.7631578947,"parsiday_acc":0.7083333333,"soft98_acc":0.8,"ninisite_discussion_acc":0.4}
         | 
| 21 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https_google.com","parameters_count":"104000000000","source_type":"Open-Source","acc":0.7364,"acc_strict":0.7364,"donyaeeqtesad_acc":0.752265861,"isna_acc":0.67578125,"ninisite_article_acc":0.7054054054,"virgool_4_acc":0.746223565,"khabaronline_acc":0.724,"digiato_acc":0.7223382046,"doctoreto_acc":0.7,"sarzamindownload_acc":0.6993464052,"hamgardi_acc":0.7020648968,"bigbangpage_acc":0.8089171975,"wiki_ahlolbait_acc":0.8486842105,"virgool_3_acc":0.7194029851,"virgool_2_acc":0.7339449541,"virgool_1_acc":0.7246835443,"hamshahrionline_acc":0.8262295082,"tabnak_acc":0.7178423237,"alibaba_acc":0.7712418301,"digikala_mag_acc":0.7715430862,"yjc_acc":0.7183908046,"beytoote_acc":0.7479224377,"asriran_acc":0.768115942,"ecoiran_acc":0.6698412698,"hawzah_acc":0.7415730337,"zoomit_acc":0.79342723,"wikipedia_acc":0.819047619,"namnak_acc":0.7220708447,"khodro45_acc":0.75,"fidibo_acc":0.7665198238,"newmiind_acc":0.6631944444,"taaghche_acc":0.7820512821,"motamem_acc":0.8631578947,"varzesh3_acc":0.7525083612,"mehrnews_acc":0.6653225806,"tasnim_acc":0.75,"magerta_acc":0.6134453782,"radiokodak_book_acc":0.652173913,"vipofilm_acc":0.9230769231,"wikishia_acc":0.8787878788,"voolak_acc":0.6511627907,"farsroid_acc":0.5,"parsiday_acc":0.7083333333,"soft98_acc":0.9,"ninisite_discussion_acc":0.7}
         | 
| 22 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.731,"acc_strict":0.7309,"donyaeeqtesad_acc":0.664652568,"isna_acc":0.69921875,"ninisite_article_acc":0.7540540541,"virgool_4_acc":0.7764350453,"khabaronline_acc":0.712,"digiato_acc":0.7265135699,"doctoreto_acc":0.78,"sarzamindownload_acc":0.7124183007,"hamgardi_acc":0.6814159292,"bigbangpage_acc":0.7770700637,"wiki_ahlolbait_acc":0.8157894737,"virgool_3_acc":0.7701492537,"virgool_2_acc":0.752293578,"virgool_1_acc":0.7784810127,"hamshahrionline_acc":0.7442622951,"tabnak_acc":0.7302904564,"alibaba_acc":0.7679738562,"digikala_mag_acc":0.7855711423,"yjc_acc":0.6781609195,"beytoote_acc":0.7423822715,"asriran_acc":0.6811594203,"ecoiran_acc":0.6857142857,"hawzah_acc":0.6882022472,"zoomit_acc":0.7417840376,"wikipedia_acc":0.8333333333,"namnak_acc":0.7166212534,"khodro45_acc":0.7720588235,"fidibo_acc":0.7400881057,"newmiind_acc":0.6736111111,"taaghche_acc":0.7179487179,"motamem_acc":0.8210526316,"varzesh3_acc":0.6956521739,"mehrnews_acc":0.689516129,"tasnim_acc":0.7269230769,"magerta_acc":0.6974789916,"radiokodak_book_acc":0.5217391304,"vipofilm_acc":0.9230769231,"wikishia_acc":0.8787878788,"voolak_acc":0.6511627907,"farsroid_acc":0.5263157895,"parsiday_acc":0.675,"soft98_acc":0.7,"ninisite_discussion_acc":0.5}
         | 
| 23 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","acc":0.7160432086,"acc_strict":0.7160432086,"donyaeeqtesad_acc":0.6888217523,"isna_acc":0.69140625,"ninisite_article_acc":0.7,"virgool_4_acc":0.7311178248,"khabaronline_acc":0.712,"digiato_acc":0.7181628392,"doctoreto_acc":0.745,"sarzamindownload_acc":0.6013071895,"hamgardi_acc":0.6755162242,"bigbangpage_acc":0.7770700637,"wiki_ahlolbait_acc":0.8684210526,"virgool_3_acc":0.7194029851,"virgool_2_acc":0.7064220183,"virgool_1_acc":0.7056962025,"hamshahrionline_acc":0.7803278689,"tabnak_acc":0.6887966805,"alibaba_acc":0.7483660131,"digikala_mag_acc":0.7434869739,"yjc_acc":0.6724137931,"beytoote_acc":0.728531856,"asriran_acc":0.7487922705,"ecoiran_acc":0.6761904762,"hawzah_acc":0.7584269663,"zoomit_acc":0.7558685446,"wikipedia_acc":0.780952381,"namnak_acc":0.7002724796,"khodro45_acc":0.7279411765,"fidibo_acc":0.7665198238,"newmiind_acc":0.6202090592,"taaghche_acc":0.7628205128,"motamem_acc":0.8404255319,"varzesh3_acc":0.7324414716,"mehrnews_acc":0.6169354839,"tasnim_acc":0.6923076923,"magerta_acc":0.6680672269,"radiokodak_book_acc":0.5652173913,"vipofilm_acc":0.9230769231,"wikishia_acc":0.7878787879,"voolak_acc":0.6511627907,"farsroid_acc":0.7105263158,"parsiday_acc":0.575,"soft98_acc":0.9,"ninisite_discussion_acc":0.3}
         | 
| 24 | 
             
            {"Model Name":"gemma-3-12b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"12200000000","source_type":"Open-Source","acc":0.7094,"acc_strict":0.7094,"donyaeeqtesad_acc":0.6586102719,"isna_acc":0.65625,"ninisite_article_acc":0.7243243243,"virgool_4_acc":0.7643504532,"khabaronline_acc":0.704,"digiato_acc":0.7369519833,"doctoreto_acc":0.76,"sarzamindownload_acc":0.6797385621,"hamgardi_acc":0.6666666667,"bigbangpage_acc":0.7515923567,"wiki_ahlolbait_acc":0.7631578947,"virgool_3_acc":0.7223880597,"virgool_2_acc":0.7584097859,"virgool_1_acc":0.7183544304,"hamshahrionline_acc":0.7213114754,"tabnak_acc":0.7219917012,"alibaba_acc":0.6830065359,"digikala_mag_acc":0.7354709419,"yjc_acc":0.6206896552,"beytoote_acc":0.7146814404,"asriran_acc":0.7198067633,"ecoiran_acc":0.6603174603,"hawzah_acc":0.702247191,"zoomit_acc":0.7323943662,"wikipedia_acc":0.7714285714,"namnak_acc":0.7329700272,"khodro45_acc":0.7352941176,"fidibo_acc":0.718061674,"newmiind_acc":0.6493055556,"taaghche_acc":0.7564102564,"motamem_acc":0.8210526316,"varzesh3_acc":0.7157190635,"mehrnews_acc":0.6088709677,"tasnim_acc":0.6576923077,"magerta_acc":0.6302521008,"radiokodak_book_acc":0.652173913,"vipofilm_acc":0.7692307692,"wikishia_acc":0.8787878788,"voolak_acc":0.6976744186,"farsroid_acc":0.7368421053,"parsiday_acc":0.6583333333,"soft98_acc":0.8,"ninisite_discussion_acc":0.8}
         | 
| 25 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","acc":0.6962,"acc_strict":0.6962,"donyaeeqtesad_acc":0.6435045317,"isna_acc":0.67578125,"ninisite_article_acc":0.7054054054,"virgool_4_acc":0.7915407855,"khabaronline_acc":0.648,"digiato_acc":0.7035490605,"doctoreto_acc":0.79,"sarzamindownload_acc":0.7450980392,"hamgardi_acc":0.6902654867,"bigbangpage_acc":0.7579617834,"wiki_ahlolbait_acc":0.6710526316,"virgool_3_acc":0.7671641791,"virgool_2_acc":0.7247706422,"virgool_1_acc":0.7278481013,"hamshahrionline_acc":0.6819672131,"tabnak_acc":0.6680497925,"alibaba_acc":0.7418300654,"digikala_mag_acc":0.7114228457,"yjc_acc":0.6781609195,"beytoote_acc":0.7119113573,"asriran_acc":0.6763285024,"ecoiran_acc":0.6349206349,"hawzah_acc":0.6685393258,"zoomit_acc":0.7042253521,"wikipedia_acc":0.8047619048,"namnak_acc":0.659400545,"khodro45_acc":0.7058823529,"fidibo_acc":0.6960352423,"newmiind_acc":0.6875,"taaghche_acc":0.6538461538,"motamem_acc":0.7684210526,"varzesh3_acc":0.6454849498,"mehrnews_acc":0.6532258065,"tasnim_acc":0.6307692308,"magerta_acc":0.6512605042,"radiokodak_book_acc":0.5652173913,"vipofilm_acc":0.6923076923,"wikishia_acc":0.7575757576,"voolak_acc":0.6046511628,"farsroid_acc":0.6578947368,"parsiday_acc":0.65,"soft98_acc":0.7,"ninisite_discussion_acc":0.4}
         | 
| 26 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https_google.com","parameters_count":"14800000000","source_type":"Open-Source","acc":0.6958,"acc_strict":0.6958,"donyaeeqtesad_acc":0.6495468278,"isna_acc":0.62890625,"ninisite_article_acc":0.6972972973,"virgool_4_acc":0.7069486405,"khabaronline_acc":0.652,"digiato_acc":0.7202505219,"doctoreto_acc":0.77,"sarzamindownload_acc":0.614379085,"hamgardi_acc":0.6430678466,"bigbangpage_acc":0.7579617834,"wiki_ahlolbait_acc":0.7631578947,"virgool_3_acc":0.7373134328,"virgool_2_acc":0.7155963303,"virgool_1_acc":0.7278481013,"hamshahrionline_acc":0.7278688525,"tabnak_acc":0.6970954357,"alibaba_acc":0.7254901961,"digikala_mag_acc":0.7074148297,"yjc_acc":0.6379310345,"beytoote_acc":0.6842105263,"asriran_acc":0.6859903382,"ecoiran_acc":0.653968254,"hawzah_acc":0.7078651685,"zoomit_acc":0.7676056338,"wikipedia_acc":0.8142857143,"namnak_acc":0.6621253406,"khodro45_acc":0.7647058824,"fidibo_acc":0.731277533,"newmiind_acc":0.6597222222,"taaghche_acc":0.6987179487,"motamem_acc":0.8105263158,"varzesh3_acc":0.6220735786,"mehrnews_acc":0.625,"tasnim_acc":0.6692307692,"magerta_acc":0.6596638655,"radiokodak_book_acc":0.5652173913,"vipofilm_acc":0.9230769231,"wikishia_acc":0.8787878788,"voolak_acc":0.6279069767,"farsroid_acc":0.6052631579,"parsiday_acc":0.5666666667,"soft98_acc":0.9,"ninisite_discussion_acc":0.7}
         | 
| 27 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https_google.com","parameters_count":"24000000000","source_type":"Open-Source","acc":0.6894,"acc_strict":0.6894,"donyaeeqtesad_acc":0.670694864,"isna_acc":0.63671875,"ninisite_article_acc":0.6945945946,"virgool_4_acc":0.7039274924,"khabaronline_acc":0.664,"digiato_acc":0.6826722338,"doctoreto_acc":0.755,"sarzamindownload_acc":0.6339869281,"hamgardi_acc":0.6342182891,"bigbangpage_acc":0.7452229299,"wiki_ahlolbait_acc":0.7697368421,"virgool_3_acc":0.7014925373,"virgool_2_acc":0.7125382263,"virgool_1_acc":0.7341772152,"hamshahrionline_acc":0.7278688525,"tabnak_acc":0.6307053942,"alibaba_acc":0.7647058824,"digikala_mag_acc":0.7174348697,"yjc_acc":0.5804597701,"beytoote_acc":0.6814404432,"asriran_acc":0.6811594203,"ecoiran_acc":0.6158730159,"hawzah_acc":0.6994382022,"zoomit_acc":0.7441314554,"wikipedia_acc":0.8333333333,"namnak_acc":0.659400545,"khodro45_acc":0.7058823529,"fidibo_acc":0.7268722467,"newmiind_acc":0.6527777778,"taaghche_acc":0.7051282051,"motamem_acc":0.8526315789,"varzesh3_acc":0.6789297659,"mehrnews_acc":0.5887096774,"tasnim_acc":0.6692307692,"magerta_acc":0.6680672269,"radiokodak_book_acc":0.4347826087,"vipofilm_acc":0.6923076923,"wikishia_acc":0.7575757576,"voolak_acc":0.6511627907,"farsroid_acc":0.6842105263,"parsiday_acc":0.55,"soft98_acc":0.8,"ninisite_discussion_acc":0.4}
         | 
| 28 | 
             
            {"Model Name":"Qwen3-30B-A3B","thinking_method":"β","model_url":"https_google.com","parameters_count":"30500000000","source_type":"Open-Source","acc":0.688,"acc_strict":0.688,"donyaeeqtesad_acc":0.6465256798,"isna_acc":0.6640625,"ninisite_article_acc":0.7243243243,"virgool_4_acc":0.7311178248,"khabaronline_acc":0.668,"digiato_acc":0.6764091858,"doctoreto_acc":0.765,"sarzamindownload_acc":0.7058823529,"hamgardi_acc":0.6519174041,"bigbangpage_acc":0.8025477707,"wiki_ahlolbait_acc":0.7368421053,"virgool_3_acc":0.7134328358,"virgool_2_acc":0.7003058104,"virgool_1_acc":0.7025316456,"hamshahrionline_acc":0.6819672131,"tabnak_acc":0.7012448133,"alibaba_acc":0.7189542484,"digikala_mag_acc":0.6753507014,"yjc_acc":0.632183908,"beytoote_acc":0.6703601108,"asriran_acc":0.652173913,"ecoiran_acc":0.6126984127,"hawzah_acc":0.7387640449,"zoomit_acc":0.7300469484,"wikipedia_acc":0.7904761905,"namnak_acc":0.6920980926,"khodro45_acc":0.7279411765,"fidibo_acc":0.6872246696,"newmiind_acc":0.6631944444,"taaghche_acc":0.6858974359,"motamem_acc":0.8,"varzesh3_acc":0.6120401338,"mehrnews_acc":0.6129032258,"tasnim_acc":0.65,"magerta_acc":0.6596638655,"radiokodak_book_acc":0.4782608696,"vipofilm_acc":0.7692307692,"wikishia_acc":0.8787878788,"voolak_acc":0.6511627907,"farsroid_acc":0.6578947368,"parsiday_acc":0.6,"soft98_acc":0.8,"ninisite_discussion_acc":0.4}
         | 
    	
        leaderboard/boards_data/persian_nlg.jsonl
    CHANGED
    
    | @@ -3,6 +3,7 @@ | |
| 3 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2438951227,"question-generation_PersianQA_rougeL_recall":0.3687301621,"question-generation_PersianQA_rougeL_f1_score":0.2816187853},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1979467916,"translation-en2fa_en2fa_epoque_bleu":0.4460981632,"translation-en2fa_en2fa_mizan_bleu":0.1745376389,"translation-en2fa_en2fa_quran_bleu":0.137406774,"translation-en2fa_en2fa_sahife_bleu":0.091586235,"translation-en2fa_en2fa_nahj_bleu":0.0490159552,"translation-en2fa_en2fa_tep_bleu":0.072776086},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.171454009,"summarization_SamSUM-fa_rougeL_recall":0.3692597258,"summarization_SamSUM-fa_rougeL_f1_score":0.2248722593},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2389011537,"translation-fa2en_fa2en_tep_bleu":0.1431825698,"translation-fa2en_fa2en_mizan_bleu":0.2056729072,"translation-fa2en_fa2en_quran_bleu":0.1776018574,"translation-fa2en_fa2en_epoque_bleu":0.4842161688,"translation-fa2en_fa2en_nahj_bleu":0.0886384727,"translation-fa2en_fa2en_sahife_bleu":0.1045044839},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.143500711,"translation-ar2fa_ar2fa_sahife_bleu":0.1221294429,"translation-ar2fa_ar2fa_nahj_bleu":0.069521493,"translation-ar2fa_ar2fa_quran_bleu":0.235152236},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1156493376,"summarization_PnSummary_rougeL_recall":0.403347998,"summarization_PnSummary_rougeL_f1_score":0.1750055649},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0689994984,"translation-fa2ar_fa2ar_nahj_bleu":0.0397020785,"translation-fa2ar_fa2ar_sahife_bleu":0.0751264317,"translation-fa2ar_fa2ar_quran_bleu":0.092169985},"nlg_score":0.1901206806}
         | 
| 4 | 
             
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2275858051,"question-generation_PersianQA_rougeL_recall":0.3654754607,"question-generation_PersianQA_rougeL_f1_score":0.2679025722},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.2099911906,"translation-en2fa_en2fa_epoque_bleu":0.4805793807,"translation-en2fa_en2fa_mizan_bleu":0.1904867707,"translation-en2fa_en2fa_quran_bleu":0.1412389522,"translation-en2fa_en2fa_sahife_bleu":0.0861059288,"translation-en2fa_en2fa_nahj_bleu":0.0528683421,"translation-en2fa_en2fa_tep_bleu":0.0688528109},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.165108522,"summarization_SamSUM-fa_rougeL_recall":0.3982318891,"summarization_SamSUM-fa_rougeL_f1_score":0.2240082992},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.234039473,"translation-fa2en_fa2en_tep_bleu":0.1597644653,"translation-fa2en_fa2en_mizan_bleu":0.1946759365,"translation-fa2en_fa2en_quran_bleu":0.1638938233,"translation-fa2en_fa2en_epoque_bleu":0.474760879,"translation-fa2en_fa2en_nahj_bleu":0.0825458621,"translation-fa2en_fa2en_sahife_bleu":0.0952634494},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1542520457,"translation-ar2fa_ar2fa_sahife_bleu":0.1283925803,"translation-ar2fa_ar2fa_nahj_bleu":0.0660434951,"translation-ar2fa_ar2fa_quran_bleu":0.2639096342},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1134979628,"summarization_PnSummary_rougeL_recall":0.3909794734,"summarization_PnSummary_rougeL_f1_score":0.1716841943},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0656699851,"translation-fa2ar_fa2ar_nahj_bleu":0.0347167128,"translation-fa2ar_fa2ar_sahife_bleu":0.0732417084,"translation-fa2ar_fa2ar_quran_bleu":0.0890515341},"nlg_score":0.18964968}
         | 
| 5 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https_google.com","parameters_count":"104000000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2149535143,"question-generation_PersianQA_rougeL_recall":0.3019561885,"question-generation_PersianQA_rougeL_f1_score":0.2405115465},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.2018158808,"translation-en2fa_en2fa_epoque_bleu":0.4332944681,"translation-en2fa_en2fa_mizan_bleu":0.1925182751,"translation-en2fa_en2fa_quran_bleu":0.1530925462,"translation-en2fa_en2fa_sahife_bleu":0.1026499453,"translation-en2fa_en2fa_nahj_bleu":0.051968827,"translation-en2fa_en2fa_tep_bleu":0.0708487287},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1591262985,"summarization_SamSUM-fa_rougeL_recall":0.4163090512,"summarization_SamSUM-fa_rougeL_f1_score":0.2208876443},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2337569687,"translation-fa2en_fa2en_tep_bleu":0.1386371644,"translation-fa2en_fa2en_mizan_bleu":0.2129637469,"translation-fa2en_fa2en_quran_bleu":0.1702102457,"translation-fa2en_fa2en_epoque_bleu":0.478211182,"translation-fa2en_fa2en_nahj_bleu":0.083013513,"translation-fa2en_fa2en_sahife_bleu":0.072000292},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1414109272,"translation-ar2fa_ar2fa_sahife_bleu":0.136408042,"translation-ar2fa_ar2fa_nahj_bleu":0.0653197648,"translation-ar2fa_ar2fa_quran_bleu":0.2187004167},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1227039295,"summarization_PnSummary_rougeL_recall":0.4315497639,"summarization_PnSummary_rougeL_f1_score":0.1856517383},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0922998074,"translation-fa2ar_fa2ar_nahj_bleu":0.0511154919,"translation-fa2ar_fa2ar_sahife_bleu":0.0589808221,"translation-fa2ar_fa2ar_quran_bleu":0.1668031083},"nlg_score":0.1880477876}
         | 
|  | |
| 6 | 
             
            {"Model Name":"gpt-4o-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1942536013,"question-generation_PersianQA_rougeL_recall":0.3435531442,"question-generation_PersianQA_rougeL_f1_score":0.2369359061},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.2014428857,"translation-en2fa_en2fa_epoque_bleu":0.4710672433,"translation-en2fa_en2fa_mizan_bleu":0.1830885263,"translation-en2fa_en2fa_quran_bleu":0.1141518863,"translation-en2fa_en2fa_sahife_bleu":0.0806159411,"translation-en2fa_en2fa_nahj_bleu":0.0504089542,"translation-en2fa_en2fa_tep_bleu":0.0648627292},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1578034675,"summarization_SamSUM-fa_rougeL_recall":0.3902121243,"summarization_SamSUM-fa_rougeL_f1_score":0.2156396673},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2332592983,"translation-fa2en_fa2en_tep_bleu":0.1497847918,"translation-fa2en_fa2en_mizan_bleu":0.1972270386,"translation-fa2en_fa2en_quran_bleu":0.1725699648,"translation-fa2en_fa2en_epoque_bleu":0.4678973942,"translation-fa2en_fa2en_nahj_bleu":0.090543674,"translation-fa2en_fa2en_sahife_bleu":0.1008380909},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1397574972,"translation-ar2fa_ar2fa_sahife_bleu":0.1273211367,"translation-ar2fa_ar2fa_nahj_bleu":0.0658485892,"translation-ar2fa_ar2fa_quran_bleu":0.2224073202},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1160048958,"summarization_PnSummary_rougeL_recall":0.3980422927,"summarization_PnSummary_rougeL_f1_score":0.1751797476},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0652599666,"translation-fa2ar_fa2ar_nahj_bleu":0.0373134355,"translation-fa2ar_fa2ar_sahife_bleu":0.0688517527,"translation-fa2ar_fa2ar_quran_bleu":0.0896147118},"nlg_score":0.1810678527}
         | 
| 7 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.3141052553,"question-generation_PersianQA_rougeL_recall":0.4102615831,"question-generation_PersianQA_rougeL_f1_score":0.3441804021},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1718324934,"translation-en2fa_en2fa_epoque_bleu":0.364783925,"translation-en2fa_en2fa_mizan_bleu":0.1532613543,"translation-en2fa_en2fa_quran_bleu":0.1620975016,"translation-en2fa_en2fa_sahife_bleu":0.0967871625,"translation-en2fa_en2fa_nahj_bleu":0.0457580774,"translation-en2fa_en2fa_tep_bleu":0.05756103},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1808561992,"summarization_SamSUM-fa_rougeL_recall":0.414509553,"summarization_SamSUM-fa_rougeL_f1_score":0.2406998552},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.0757086487,"translation-fa2en_fa2en_tep_bleu":0.0316922994,"translation-fa2en_fa2en_mizan_bleu":0.0530331645,"translation-fa2en_fa2en_quran_bleu":0.1028139165,"translation-fa2en_fa2en_epoque_bleu":0.157367237,"translation-fa2en_fa2en_nahj_bleu":0.0336372263,"translation-fa2en_fa2en_sahife_bleu":0.0279485156},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.15661924,"translation-ar2fa_ar2fa_sahife_bleu":0.1122809429,"translation-ar2fa_ar2fa_nahj_bleu":0.0629397909,"translation-ar2fa_ar2fa_quran_bleu":0.2899530138},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1228424623,"summarization_PnSummary_rougeL_recall":0.3750771332,"summarization_PnSummary_rougeL_f1_score":0.1793201723},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.079257203,"translation-fa2ar_fa2ar_nahj_bleu":0.0338415847,"translation-fa2ar_fa2ar_sahife_bleu":0.0570744002,"translation-fa2ar_fa2ar_quran_bleu":0.146855624},"nlg_score":0.178231145}
         | 
| 8 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1693490122,"question-generation_PersianQA_rougeL_recall":0.3886090827,"question-generation_PersianQA_rougeL_f1_score":0.227277052},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1799534349,"translation-en2fa_en2fa_epoque_bleu":0.4004213933,"translation-en2fa_en2fa_mizan_bleu":0.1703393716,"translation-en2fa_en2fa_quran_bleu":0.1225698669,"translation-en2fa_en2fa_sahife_bleu":0.0832764011,"translation-en2fa_en2fa_nahj_bleu":0.0439108113,"translation-en2fa_en2fa_tep_bleu":0.0595417592},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1538512444,"summarization_SamSUM-fa_rougeL_recall":0.3849531288,"summarization_SamSUM-fa_rougeL_f1_score":0.2115502707},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2247897554,"translation-fa2en_fa2en_tep_bleu":0.1341840946,"translation-fa2en_fa2en_mizan_bleu":0.1909021288,"translation-fa2en_fa2en_quran_bleu":0.1740971535,"translation-fa2en_fa2en_epoque_bleu":0.4544315204,"translation-fa2en_fa2en_nahj_bleu":0.0877235615,"translation-fa2en_fa2en_sahife_bleu":0.0975791022},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1471879954,"translation-ar2fa_ar2fa_sahife_bleu":0.1294214814,"translation-ar2fa_ar2fa_nahj_bleu":0.0642841927,"translation-ar2fa_ar2fa_quran_bleu":0.2437131219},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1188323392,"summarization_PnSummary_rougeL_recall":0.3948447809,"summarization_PnSummary_rougeL_f1_score":0.1786530476},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0761269879,"translation-fa2ar_fa2ar_nahj_bleu":0.0321440801,"translation-fa2ar_fa2ar_sahife_bleu":0.0613632957,"translation-fa2ar_fa2ar_quran_bleu":0.134873588},"nlg_score":0.1779340777}
         | 
| @@ -10,12 +11,16 @@ | |
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2281053588,"question-generation_PersianQA_rougeL_recall":0.370933314,"question-generation_PersianQA_rougeL_f1_score":0.273363418},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1623218856,"translation-en2fa_en2fa_epoque_bleu":0.3677879105,"translation-en2fa_en2fa_mizan_bleu":0.147599732,"translation-en2fa_en2fa_quran_bleu":0.0938457658,"translation-en2fa_en2fa_sahife_bleu":0.0698903005,"translation-en2fa_en2fa_nahj_bleu":0.0435129812,"translation-en2fa_en2fa_tep_bleu":0.0620337306},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1514618398,"summarization_SamSUM-fa_rougeL_recall":0.3683020708,"summarization_SamSUM-fa_rougeL_f1_score":0.2063212948},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.217991447,"translation-fa2en_fa2en_tep_bleu":0.1271542443,"translation-fa2en_fa2en_mizan_bleu":0.1728081337,"translation-fa2en_fa2en_quran_bleu":0.158860515,"translation-fa2en_fa2en_epoque_bleu":0.4572670962,"translation-fa2en_fa2en_nahj_bleu":0.0902445729,"translation-fa2en_fa2en_sahife_bleu":0.0945000287},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0985860814,"translation-ar2fa_ar2fa_sahife_bleu":0.0857687109,"translation-ar2fa_ar2fa_nahj_bleu":0.0622600203,"translation-ar2fa_ar2fa_quran_bleu":0.1459132099},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1089978489,"summarization_PnSummary_rougeL_recall":0.3936021933,"summarization_PnSummary_rougeL_f1_score":0.1662525669},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0507003531,"translation-fa2ar_fa2ar_nahj_bleu":0.0316047659,"translation-fa2ar_fa2ar_sahife_bleu":0.0534488007,"translation-fa2ar_fa2ar_quran_bleu":0.0670474926},"nlg_score":0.1679338638}
         | 
| 11 | 
             
            {"Model Name":"gpt-4.1-nano","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1622159789,"question-generation_PersianQA_rougeL_recall":0.302597472,"question-generation_PersianQA_rougeL_f1_score":0.2021048057},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1831593088,"translation-en2fa_en2fa_epoque_bleu":0.4052150706,"translation-en2fa_en2fa_mizan_bleu":0.1692823494,"translation-en2fa_en2fa_quran_bleu":0.1400476579,"translation-en2fa_en2fa_sahife_bleu":0.0812805634,"translation-en2fa_en2fa_nahj_bleu":0.048146149,"translation-en2fa_en2fa_tep_bleu":0.0610881446},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.16175156,"summarization_SamSUM-fa_rougeL_recall":0.3477483743,"summarization_SamSUM-fa_rougeL_f1_score":0.209834706},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2165819036,"translation-fa2en_fa2en_tep_bleu":0.13491043,"translation-fa2en_fa2en_mizan_bleu":0.1810957829,"translation-fa2en_fa2en_quran_bleu":0.164168601,"translation-fa2en_fa2en_epoque_bleu":0.4383628208,"translation-fa2en_fa2en_nahj_bleu":0.0942939662,"translation-fa2en_fa2en_sahife_bleu":0.0827637394},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1315367808,"translation-ar2fa_ar2fa_sahife_bleu":0.1063921688,"translation-ar2fa_ar2fa_nahj_bleu":0.0642188893,"translation-ar2fa_ar2fa_quran_bleu":0.2206333896},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1120916238,"summarization_PnSummary_rougeL_recall":0.3610411286,"summarization_PnSummary_rougeL_f1_score":0.1660826543},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0568324844,"translation-fa2ar_fa2ar_nahj_bleu":0.03267488,"translation-fa2ar_fa2ar_sahife_bleu":0.0579381183,"translation-fa2ar_fa2ar_quran_bleu":0.0798844549},"nlg_score":0.1665903777}
         | 
| 12 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2782492277,"question-generation_PersianQA_rougeL_recall":0.3823213358,"question-generation_PersianQA_rougeL_f1_score":0.3109786075},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1750457687,"translation-en2fa_en2fa_epoque_bleu":0.3740903807,"translation-en2fa_en2fa_mizan_bleu":0.1593083308,"translation-en2fa_en2fa_quran_bleu":0.1325582833,"translation-en2fa_en2fa_sahife_bleu":0.1002994879,"translation-en2fa_en2fa_nahj_bleu":0.0501235873,"translation-en2fa_en2fa_tep_bleu":0.0652393013},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1810410242,"summarization_SamSUM-fa_rougeL_recall":0.4016180552,"summarization_SamSUM-fa_rougeL_f1_score":0.2380560527},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.0858473556,"translation-fa2en_fa2en_tep_bleu":0.0381837678,"translation-fa2en_fa2en_mizan_bleu":0.0750320212,"translation-fa2en_fa2en_quran_bleu":0.0986486354,"translation-fa2en_fa2en_epoque_bleu":0.1513689047,"translation-fa2en_fa2en_nahj_bleu":0.0568182224,"translation-fa2en_fa2en_sahife_bleu":0.0570620784},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1430472928,"translation-ar2fa_ar2fa_sahife_bleu":0.1326018858,"translation-ar2fa_ar2fa_nahj_bleu":0.0532180128,"translation-ar2fa_ar2fa_quran_bleu":0.2388305158},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1191404443,"summarization_PnSummary_rougeL_recall":0.365434541,"summarization_PnSummary_rougeL_f1_score":0.1744092468},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0341529902,"translation-fa2ar_fa2ar_nahj_bleu":0.0198079243,"translation-fa2ar_fa2ar_sahife_bleu":0.041930434,"translation-fa2ar_fa2ar_quran_bleu":0.0407206123},"nlg_score":0.1659339021}
         | 
|  | |
| 13 | 
             
            {"Model Name":"c4ai-command-r-v01","thinking_method":"β","model_url":"https_google.com","parameters_count":"35000000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1546246184,"question-generation_PersianQA_rougeL_recall":0.253394795,"question-generation_PersianQA_rougeL_f1_score":0.1829113647},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1506934102,"translation-en2fa_en2fa_epoque_bleu":0.2951032905,"translation-en2fa_en2fa_mizan_bleu":0.1500681264,"translation-en2fa_en2fa_quran_bleu":0.1104277702,"translation-en2fa_en2fa_sahife_bleu":0.092222972,"translation-en2fa_en2fa_nahj_bleu":0.0497623005,"translation-en2fa_en2fa_tep_bleu":0.0692905167},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1944265929,"summarization_SamSUM-fa_rougeL_recall":0.3761499249,"summarization_SamSUM-fa_rougeL_f1_score":0.242617187},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.1892370035,"translation-fa2en_fa2en_tep_bleu":0.1290684643,"translation-fa2en_fa2en_mizan_bleu":0.1721408901,"translation-fa2en_fa2en_quran_bleu":0.1736791408,"translation-fa2en_fa2en_epoque_bleu":0.346100597,"translation-fa2en_fa2en_nahj_bleu":0.0776400174,"translation-fa2en_fa2en_sahife_bleu":0.08279759},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1144863268,"translation-ar2fa_ar2fa_sahife_bleu":0.1190971594,"translation-ar2fa_ar2fa_nahj_bleu":0.0648109303,"translation-ar2fa_ar2fa_quran_bleu":0.157067121},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1298447221,"summarization_PnSummary_rougeL_recall":0.3548911672,"summarization_PnSummary_rougeL_f1_score":0.1841564462},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0852951832,"translation-fa2ar_fa2ar_nahj_bleu":0.0464072569,"translation-fa2ar_fa2ar_sahife_bleu":0.0713426227,"translation-fa2ar_fa2ar_quran_bleu":0.1381356701},"nlg_score":0.1641995602}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-30B-A3B","thinking_method":"β","model_url":"https_google.com","parameters_count":"30500000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1996840686,"question-generation_PersianQA_rougeL_recall":0.3393114266,"question-generation_PersianQA_rougeL_f1_score":0.2417040176},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1617787549,"translation-en2fa_en2fa_epoque_bleu":0.3821529147,"translation-en2fa_en2fa_mizan_bleu":0.1337537913,"translation-en2fa_en2fa_quran_bleu":0.0860909143,"translation-en2fa_en2fa_sahife_bleu":0.0770506908,"translation-en2fa_en2fa_nahj_bleu":0.0441728515,"translation-en2fa_en2fa_tep_bleu":0.0587014819},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1523824175,"summarization_SamSUM-fa_rougeL_recall":0.3838683519,"summarization_SamSUM-fa_rougeL_f1_score":0.2083553767},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2177785793,"translation-fa2en_fa2en_tep_bleu":0.1189948472,"translation-fa2en_fa2en_mizan_bleu":0.1793626928,"translation-fa2en_fa2en_quran_bleu":0.1718006478,"translation-fa2en_fa2en_epoque_bleu":0.4500382308,"translation-fa2en_fa2en_nahj_bleu":0.0836776138,"translation-fa2en_fa2en_sahife_bleu":0.1034067477},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.090408759,"translation-ar2fa_ar2fa_sahife_bleu":0.0778953352,"translation-ar2fa_ar2fa_nahj_bleu":0.0610049198,"translation-ar2fa_ar2fa_quran_bleu":0.13085583},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1212751301,"summarization_PnSummary_rougeL_recall":0.3923323141,"summarization_PnSummary_rougeL_f1_score":0.1804727387},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0483297895,"translation-fa2ar_fa2ar_nahj_bleu":0.0310247441,"translation-fa2ar_fa2ar_sahife_bleu":0.0512375201,"translation-fa2ar_fa2ar_quran_bleu":0.0627271043},"nlg_score":0.164118288}
         | 
| 15 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https_google.com","parameters_count":"14800000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1987198912,"question-generation_PersianQA_rougeL_recall":0.3431437262,"question-generation_PersianQA_rougeL_f1_score":0.2419384398},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1535253787,"translation-en2fa_en2fa_epoque_bleu":0.3553678809,"translation-en2fa_en2fa_mizan_bleu":0.1285441922,"translation-en2fa_en2fa_quran_bleu":0.0857809616,"translation-en2fa_en2fa_sahife_bleu":0.0787025343,"translation-en2fa_en2fa_nahj_bleu":0.0404850935,"translation-en2fa_en2fa_tep_bleu":0.0586129062},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1469468837,"summarization_SamSUM-fa_rougeL_recall":0.3743807014,"summarization_SamSUM-fa_rougeL_f1_score":0.2022859929},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2145488085,"translation-fa2en_fa2en_tep_bleu":0.1307272464,"translation-fa2en_fa2en_mizan_bleu":0.1697754862,"translation-fa2en_fa2en_quran_bleu":0.1552415558,"translation-fa2en_fa2en_epoque_bleu":0.4513682579,"translation-fa2en_fa2en_nahj_bleu":0.0842673472,"translation-fa2en_fa2en_sahife_bleu":0.0853787118},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0910450298,"translation-ar2fa_ar2fa_sahife_bleu":0.0862679894,"translation-ar2fa_ar2fa_nahj_bleu":0.0558129824,"translation-ar2fa_ar2fa_quran_bleu":0.1292925153},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1123870374,"summarization_PnSummary_rougeL_recall":0.4032007327,"summarization_PnSummary_rougeL_f1_score":0.17115848},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0494411806,"translation-fa2ar_fa2ar_nahj_bleu":0.0369805868,"translation-fa2ar_fa2ar_sahife_bleu":0.0567654991,"translation-fa2ar_fa2ar_quran_bleu":0.0545774559},"nlg_score":0.16056333}
         | 
|  | |
| 16 | 
             
            {"Model Name":"Qwen3-8B","thinking_method":"β","model_url":"https_google.com","parameters_count":"8190000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1965366702,"question-generation_PersianQA_rougeL_recall":0.340760284,"question-generation_PersianQA_rougeL_f1_score":0.2388923895},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1550276898,"translation-en2fa_en2fa_epoque_bleu":0.3721582216,"translation-en2fa_en2fa_mizan_bleu":0.1231599039,"translation-en2fa_en2fa_quran_bleu":0.0882213453,"translation-en2fa_en2fa_sahife_bleu":0.0725213197,"translation-en2fa_en2fa_nahj_bleu":0.0424186358,"translation-en2fa_en2fa_tep_bleu":0.0528718634},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1463365551,"summarization_SamSUM-fa_rougeL_recall":0.3856017289,"summarization_SamSUM-fa_rougeL_f1_score":0.2024070197},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2024225184,"translation-fa2en_fa2en_tep_bleu":0.1163127945,"translation-fa2en_fa2en_mizan_bleu":0.1649009947,"translation-fa2en_fa2en_quran_bleu":0.1513328968,"translation-fa2en_fa2en_epoque_bleu":0.4171232399,"translation-fa2en_fa2en_nahj_bleu":0.0857999462,"translation-fa2en_fa2en_sahife_bleu":0.0929479364},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0821020713,"translation-ar2fa_ar2fa_sahife_bleu":0.0730469461,"translation-ar2fa_ar2fa_nahj_bleu":0.0579031327,"translation-ar2fa_ar2fa_quran_bleu":0.1141461882},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.109255822,"summarization_PnSummary_rougeL_recall":0.3979273385,"summarization_PnSummary_rougeL_f1_score":0.1669061111},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0423318046,"translation-fa2ar_fa2ar_nahj_bleu":0.0329089717,"translation-fa2ar_fa2ar_sahife_bleu":0.0445101244,"translation-fa2ar_fa2ar_quran_bleu":0.0495763178},"nlg_score":0.1557270864}
         | 
|  | |
| 17 | 
             
            {"Model Name":"Qwen3-4B","thinking_method":"β","model_url":"https_google.com","parameters_count":"4020000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1744197112,"question-generation_PersianQA_rougeL_recall":0.2697024508,"question-generation_PersianQA_rougeL_f1_score":0.2017710943},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1217211215,"translation-en2fa_en2fa_epoque_bleu":0.2916268514,"translation-en2fa_en2fa_mizan_bleu":0.091925603,"translation-en2fa_en2fa_quran_bleu":0.065498518,"translation-en2fa_en2fa_sahife_bleu":0.0612237455,"translation-en2fa_en2fa_nahj_bleu":0.0385824628,"translation-en2fa_en2fa_tep_bleu":0.0453883692},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1429609514,"summarization_SamSUM-fa_rougeL_recall":0.397717388,"summarization_SamSUM-fa_rougeL_f1_score":0.2013136641},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.1840809218,"translation-fa2en_fa2en_tep_bleu":0.1011436783,"translation-fa2en_fa2en_mizan_bleu":0.149157222,"translation-fa2en_fa2en_quran_bleu":0.1377761662,"translation-fa2en_fa2en_epoque_bleu":0.3802946233,"translation-fa2en_fa2en_nahj_bleu":0.0851756367,"translation-fa2en_fa2en_sahife_bleu":0.0857201524},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0636385541,"translation-ar2fa_ar2fa_sahife_bleu":0.0557180428,"translation-ar2fa_ar2fa_nahj_bleu":0.0539968488,"translation-ar2fa_ar2fa_quran_bleu":0.0807186853},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1067208324,"summarization_PnSummary_rougeL_recall":0.4109136551,"summarization_PnSummary_rougeL_f1_score":0.1648475797},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0351351131,"translation-fa2ar_fa2ar_nahj_bleu":0.0313503027,"translation-fa2ar_fa2ar_sahife_bleu":0.042075565,"translation-fa2ar_fa2ar_quran_bleu":0.0319794715},"nlg_score":0.1389297212}
         | 
| 18 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.3121385499,"question-generation_PersianQA_rougeL_recall":0.4162991047,"question-generation_PersianQA_rougeL_f1_score":0.3445136596},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.0650794176,"translation-en2fa_en2fa_epoque_bleu":0.1194375779,"translation-en2fa_en2fa_mizan_bleu":0.0640649978,"translation-en2fa_en2fa_quran_bleu":0.0926514743,"translation-en2fa_en2fa_sahife_bleu":0.0392464347,"translation-en2fa_en2fa_nahj_bleu":0.022322883,"translation-en2fa_en2fa_tep_bleu":0.0184227674},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1525978605,"summarization_SamSUM-fa_rougeL_recall":0.3945587249,"summarization_SamSUM-fa_rougeL_f1_score":0.209852471},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.0559484689,"translation-fa2en_fa2en_tep_bleu":0.0190401646,"translation-fa2en_fa2en_mizan_bleu":0.0369126121,"translation-fa2en_fa2en_quran_bleu":0.0401048971,"translation-fa2en_fa2en_epoque_bleu":0.1381975553,"translation-fa2en_fa2en_nahj_bleu":0.0232788817,"translation-fa2en_fa2en_sahife_bleu":0.017477039},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0772188097,"translation-ar2fa_ar2fa_sahife_bleu":0.0610321929,"translation-ar2fa_ar2fa_nahj_bleu":0.0273061824,"translation-ar2fa_ar2fa_quran_bleu":0.1408224224},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1070140366,"summarization_PnSummary_rougeL_recall":0.4357356292,"summarization_PnSummary_rougeL_f1_score":0.1672508999},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0382543341,"translation-fa2ar_fa2ar_nahj_bleu":0.032191006,"translation-fa2ar_fa2ar_sahife_bleu":0.028980881,"translation-fa2ar_fa2ar_quran_bleu":0.0535911152},"nlg_score":0.1368740087}
         | 
|  | |
| 19 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https_google.com","parameters_count":"24000000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1520819517,"question-generation_PersianQA_rougeL_recall":0.26324767,"question-generation_PersianQA_rougeL_f1_score":0.1843401988},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1458447378,"translation-en2fa_en2fa_epoque_bleu":0.3541508677,"translation-en2fa_en2fa_mizan_bleu":0.1259468635,"translation-en2fa_en2fa_quran_bleu":0.0887225632,"translation-en2fa_en2fa_sahife_bleu":0.0672732746,"translation-en2fa_en2fa_nahj_bleu":0.0407327793,"translation-en2fa_en2fa_tep_bleu":0.0293172873},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.147286408,"summarization_SamSUM-fa_rougeL_recall":0.4066657958,"summarization_SamSUM-fa_rougeL_f1_score":0.2072278176},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.1451163884,"translation-fa2en_fa2en_tep_bleu":0.0393307601,"translation-fa2en_fa2en_mizan_bleu":0.1009347025,"translation-fa2en_fa2en_quran_bleu":0.0929688918,"translation-fa2en_fa2en_epoque_bleu":0.3660914464,"translation-fa2en_fa2en_nahj_bleu":0.0536507876,"translation-fa2en_fa2en_sahife_bleu":0.05038339},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0594554675,"translation-ar2fa_ar2fa_sahife_bleu":0.0539986603,"translation-ar2fa_ar2fa_nahj_bleu":0.035240584,"translation-ar2fa_ar2fa_quran_bleu":0.0879164142},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1029257145,"summarization_PnSummary_rougeL_recall":0.4347811424,"summarization_PnSummary_rougeL_f1_score":0.1621438757},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0192357288,"translation-fa2ar_fa2ar_nahj_bleu":0.0151369319,"translation-fa2ar_fa2ar_sahife_bleu":0.0245784397,"translation-fa2ar_fa2ar_quran_bleu":0.0179918148},"nlg_score":0.1319091735}
         | 
| 20 | 
             
            {"Model Name":"gemma-3-12b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"12200000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2572991833,"question-generation_PersianQA_rougeL_recall":0.3740225235,"question-generation_PersianQA_rougeL_f1_score":0.2927586837},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.08817485,"translation-en2fa_en2fa_epoque_bleu":0.1886801725,"translation-en2fa_en2fa_mizan_bleu":0.0879987558,"translation-en2fa_en2fa_quran_bleu":0.0657922023,"translation-en2fa_en2fa_sahife_bleu":0.0296141618,"translation-en2fa_en2fa_nahj_bleu":0.0192266597,"translation-en2fa_en2fa_tep_bleu":0.0366296874},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1658145118,"summarization_SamSUM-fa_rougeL_recall":0.3677760479,"summarization_SamSUM-fa_rougeL_f1_score":0.2189237562},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.0257184881,"translation-fa2en_fa2en_tep_bleu":0.011593122,"translation-fa2en_fa2en_mizan_bleu":0.0215328963,"translation-fa2en_fa2en_quran_bleu":0.0262056878,"translation-fa2en_fa2en_epoque_bleu":0.047221295,"translation-fa2en_fa2en_nahj_bleu":0.0178557856,"translation-fa2en_fa2en_sahife_bleu":0.0169922826},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.032619077,"translation-ar2fa_ar2fa_sahife_bleu":0.0333185867,"translation-ar2fa_ar2fa_nahj_bleu":0.0106299838,"translation-ar2fa_ar2fa_quran_bleu":0.0528092057},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1156871575,"summarization_PnSummary_rougeL_recall":0.3630716995,"summarization_PnSummary_rougeL_f1_score":0.1697348346},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0098333287,"translation-fa2ar_fa2ar_nahj_bleu":0.0072190824,"translation-fa2ar_fa2ar_sahife_bleu":0.0110570977,"translation-fa2ar_fa2ar_quran_bleu":0.0112238061},"nlg_score":0.1196804312}
         | 
| 21 | 
             
            {"Model Name":"aya-expanse-32b","thinking_method":"β","model_url":"https_google.com","parameters_count":"32300000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.0980160864,"question-generation_PersianQA_rougeL_recall":0.347983913,"question-generation_PersianQA_rougeL_f1_score":0.1443872083},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.0951102411,"translation-en2fa_en2fa_epoque_bleu":0.2204131973,"translation-en2fa_en2fa_mizan_bleu":0.0772021612,"translation-en2fa_en2fa_quran_bleu":0.0914129011,"translation-en2fa_en2fa_sahife_bleu":0.0555605793,"translation-en2fa_en2fa_nahj_bleu":0.0296371925,"translation-en2fa_en2fa_tep_bleu":0.0145962694},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1338082958,"summarization_SamSUM-fa_rougeL_recall":0.397938928,"summarization_SamSUM-fa_rougeL_f1_score":0.1933390916},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.14443262,"translation-fa2en_fa2en_tep_bleu":0.0636878051,"translation-fa2en_fa2en_mizan_bleu":0.1045784226,"translation-fa2en_fa2en_quran_bleu":0.1065169191,"translation-fa2en_fa2en_epoque_bleu":0.3331896819,"translation-fa2en_fa2en_nahj_bleu":0.0573420672,"translation-fa2en_fa2en_sahife_bleu":0.0526154809},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0608470749,"translation-ar2fa_ar2fa_sahife_bleu":0.0636783644,"translation-ar2fa_ar2fa_nahj_bleu":0.0258604511,"translation-ar2fa_ar2fa_quran_bleu":0.091253078},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1094933227,"summarization_PnSummary_rougeL_recall":0.3979476995,"summarization_PnSummary_rougeL_f1_score":0.1674664883},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0318976507,"translation-fa2ar_fa2ar_nahj_bleu":0.0222927973,"translation-fa2ar_fa2ar_sahife_bleu":0.0296757253,"translation-fa2ar_fa2ar_quran_bleu":0.0437244293},"nlg_score":0.1196400535}
         | 
|  | |
| 3 | 
             
            {"Model Name":"gpt-4.1-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2438951227,"question-generation_PersianQA_rougeL_recall":0.3687301621,"question-generation_PersianQA_rougeL_f1_score":0.2816187853},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1979467916,"translation-en2fa_en2fa_epoque_bleu":0.4460981632,"translation-en2fa_en2fa_mizan_bleu":0.1745376389,"translation-en2fa_en2fa_quran_bleu":0.137406774,"translation-en2fa_en2fa_sahife_bleu":0.091586235,"translation-en2fa_en2fa_nahj_bleu":0.0490159552,"translation-en2fa_en2fa_tep_bleu":0.072776086},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.171454009,"summarization_SamSUM-fa_rougeL_recall":0.3692597258,"summarization_SamSUM-fa_rougeL_f1_score":0.2248722593},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2389011537,"translation-fa2en_fa2en_tep_bleu":0.1431825698,"translation-fa2en_fa2en_mizan_bleu":0.2056729072,"translation-fa2en_fa2en_quran_bleu":0.1776018574,"translation-fa2en_fa2en_epoque_bleu":0.4842161688,"translation-fa2en_fa2en_nahj_bleu":0.0886384727,"translation-fa2en_fa2en_sahife_bleu":0.1045044839},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.143500711,"translation-ar2fa_ar2fa_sahife_bleu":0.1221294429,"translation-ar2fa_ar2fa_nahj_bleu":0.069521493,"translation-ar2fa_ar2fa_quran_bleu":0.235152236},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1156493376,"summarization_PnSummary_rougeL_recall":0.403347998,"summarization_PnSummary_rougeL_f1_score":0.1750055649},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0689994984,"translation-fa2ar_fa2ar_nahj_bleu":0.0397020785,"translation-fa2ar_fa2ar_sahife_bleu":0.0751264317,"translation-fa2ar_fa2ar_quran_bleu":0.092169985},"nlg_score":0.1901206806}
         | 
| 4 | 
             
            {"Model Name":"gpt-4o","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2275858051,"question-generation_PersianQA_rougeL_recall":0.3654754607,"question-generation_PersianQA_rougeL_f1_score":0.2679025722},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.2099911906,"translation-en2fa_en2fa_epoque_bleu":0.4805793807,"translation-en2fa_en2fa_mizan_bleu":0.1904867707,"translation-en2fa_en2fa_quran_bleu":0.1412389522,"translation-en2fa_en2fa_sahife_bleu":0.0861059288,"translation-en2fa_en2fa_nahj_bleu":0.0528683421,"translation-en2fa_en2fa_tep_bleu":0.0688528109},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.165108522,"summarization_SamSUM-fa_rougeL_recall":0.3982318891,"summarization_SamSUM-fa_rougeL_f1_score":0.2240082992},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.234039473,"translation-fa2en_fa2en_tep_bleu":0.1597644653,"translation-fa2en_fa2en_mizan_bleu":0.1946759365,"translation-fa2en_fa2en_quran_bleu":0.1638938233,"translation-fa2en_fa2en_epoque_bleu":0.474760879,"translation-fa2en_fa2en_nahj_bleu":0.0825458621,"translation-fa2en_fa2en_sahife_bleu":0.0952634494},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1542520457,"translation-ar2fa_ar2fa_sahife_bleu":0.1283925803,"translation-ar2fa_ar2fa_nahj_bleu":0.0660434951,"translation-ar2fa_ar2fa_quran_bleu":0.2639096342},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1134979628,"summarization_PnSummary_rougeL_recall":0.3909794734,"summarization_PnSummary_rougeL_f1_score":0.1716841943},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0656699851,"translation-fa2ar_fa2ar_nahj_bleu":0.0347167128,"translation-fa2ar_fa2ar_sahife_bleu":0.0732417084,"translation-fa2ar_fa2ar_quran_bleu":0.0890515341},"nlg_score":0.18964968}
         | 
| 5 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https_google.com","parameters_count":"104000000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2149535143,"question-generation_PersianQA_rougeL_recall":0.3019561885,"question-generation_PersianQA_rougeL_f1_score":0.2405115465},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.2018158808,"translation-en2fa_en2fa_epoque_bleu":0.4332944681,"translation-en2fa_en2fa_mizan_bleu":0.1925182751,"translation-en2fa_en2fa_quran_bleu":0.1530925462,"translation-en2fa_en2fa_sahife_bleu":0.1026499453,"translation-en2fa_en2fa_nahj_bleu":0.051968827,"translation-en2fa_en2fa_tep_bleu":0.0708487287},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1591262985,"summarization_SamSUM-fa_rougeL_recall":0.4163090512,"summarization_SamSUM-fa_rougeL_f1_score":0.2208876443},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2337569687,"translation-fa2en_fa2en_tep_bleu":0.1386371644,"translation-fa2en_fa2en_mizan_bleu":0.2129637469,"translation-fa2en_fa2en_quran_bleu":0.1702102457,"translation-fa2en_fa2en_epoque_bleu":0.478211182,"translation-fa2en_fa2en_nahj_bleu":0.083013513,"translation-fa2en_fa2en_sahife_bleu":0.072000292},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1414109272,"translation-ar2fa_ar2fa_sahife_bleu":0.136408042,"translation-ar2fa_ar2fa_nahj_bleu":0.0653197648,"translation-ar2fa_ar2fa_quran_bleu":0.2187004167},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1227039295,"summarization_PnSummary_rougeL_recall":0.4315497639,"summarization_PnSummary_rougeL_f1_score":0.1856517383},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0922998074,"translation-fa2ar_fa2ar_nahj_bleu":0.0511154919,"translation-fa2ar_fa2ar_sahife_bleu":0.0589808221,"translation-fa2ar_fa2ar_quran_bleu":0.1668031083},"nlg_score":0.1880477876}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2602516122,"question-generation_PersianQA_rougeL_recall":0.3803807526,"question-generation_PersianQA_rougeL_f1_score":0.2967852302},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1757431213,"translation-en2fa_en2fa_epoque_bleu":0.3745398253,"translation-en2fa_en2fa_mizan_bleu":0.1640890656,"translation-en2fa_en2fa_quran_bleu":0.1377843747,"translation-en2fa_en2fa_sahife_bleu":0.0895949257,"translation-en2fa_en2fa_nahj_bleu":0.0437585905,"translation-en2fa_en2fa_tep_bleu":0.0679088622},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1553547312,"summarization_SamSUM-fa_rougeL_recall":0.3357735524,"summarization_SamSUM-fa_rougeL_f1_score":0.2045988783},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2435498156,"translation-fa2en_fa2en_tep_bleu":0.1656898075,"translation-fa2en_fa2en_mizan_bleu":0.2055420364,"translation-fa2en_fa2en_quran_bleu":0.1726910304,"translation-fa2en_fa2en_epoque_bleu":0.4912890145,"translation-fa2en_fa2en_nahj_bleu":0.0882784037,"translation-fa2en_fa2en_sahife_bleu":0.0952319793},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1334075162,"translation-ar2fa_ar2fa_sahife_bleu":0.1143867102,"translation-ar2fa_ar2fa_nahj_bleu":0.063272709,"translation-ar2fa_ar2fa_quran_bleu":0.2190563892},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.0917305447,"summarization_PnSummary_rougeL_recall":0.3893845098,"summarization_PnSummary_rougeL_f1_score":0.1447284086},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0720575119,"translation-fa2ar_fa2ar_nahj_bleu":0.037394526,"translation-fa2ar_fa2ar_sahife_bleu":0.0636064419,"translation-fa2ar_fa2ar_quran_bleu":0.1151715676},"nlg_score":0.181552926}
         | 
| 7 | 
             
            {"Model Name":"gpt-4o-mini","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1942536013,"question-generation_PersianQA_rougeL_recall":0.3435531442,"question-generation_PersianQA_rougeL_f1_score":0.2369359061},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.2014428857,"translation-en2fa_en2fa_epoque_bleu":0.4710672433,"translation-en2fa_en2fa_mizan_bleu":0.1830885263,"translation-en2fa_en2fa_quran_bleu":0.1141518863,"translation-en2fa_en2fa_sahife_bleu":0.0806159411,"translation-en2fa_en2fa_nahj_bleu":0.0504089542,"translation-en2fa_en2fa_tep_bleu":0.0648627292},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1578034675,"summarization_SamSUM-fa_rougeL_recall":0.3902121243,"summarization_SamSUM-fa_rougeL_f1_score":0.2156396673},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2332592983,"translation-fa2en_fa2en_tep_bleu":0.1497847918,"translation-fa2en_fa2en_mizan_bleu":0.1972270386,"translation-fa2en_fa2en_quran_bleu":0.1725699648,"translation-fa2en_fa2en_epoque_bleu":0.4678973942,"translation-fa2en_fa2en_nahj_bleu":0.090543674,"translation-fa2en_fa2en_sahife_bleu":0.1008380909},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1397574972,"translation-ar2fa_ar2fa_sahife_bleu":0.1273211367,"translation-ar2fa_ar2fa_nahj_bleu":0.0658485892,"translation-ar2fa_ar2fa_quran_bleu":0.2224073202},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1160048958,"summarization_PnSummary_rougeL_recall":0.3980422927,"summarization_PnSummary_rougeL_f1_score":0.1751797476},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0652599666,"translation-fa2ar_fa2ar_nahj_bleu":0.0373134355,"translation-fa2ar_fa2ar_sahife_bleu":0.0688517527,"translation-fa2ar_fa2ar_quran_bleu":0.0896147118},"nlg_score":0.1810678527}
         | 
| 8 | 
             
            {"Model Name":"gemini-2.0-flash","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.3141052553,"question-generation_PersianQA_rougeL_recall":0.4102615831,"question-generation_PersianQA_rougeL_f1_score":0.3441804021},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1718324934,"translation-en2fa_en2fa_epoque_bleu":0.364783925,"translation-en2fa_en2fa_mizan_bleu":0.1532613543,"translation-en2fa_en2fa_quran_bleu":0.1620975016,"translation-en2fa_en2fa_sahife_bleu":0.0967871625,"translation-en2fa_en2fa_nahj_bleu":0.0457580774,"translation-en2fa_en2fa_tep_bleu":0.05756103},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1808561992,"summarization_SamSUM-fa_rougeL_recall":0.414509553,"summarization_SamSUM-fa_rougeL_f1_score":0.2406998552},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.0757086487,"translation-fa2en_fa2en_tep_bleu":0.0316922994,"translation-fa2en_fa2en_mizan_bleu":0.0530331645,"translation-fa2en_fa2en_quran_bleu":0.1028139165,"translation-fa2en_fa2en_epoque_bleu":0.157367237,"translation-fa2en_fa2en_nahj_bleu":0.0336372263,"translation-fa2en_fa2en_sahife_bleu":0.0279485156},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.15661924,"translation-ar2fa_ar2fa_sahife_bleu":0.1122809429,"translation-ar2fa_ar2fa_nahj_bleu":0.0629397909,"translation-ar2fa_ar2fa_quran_bleu":0.2899530138},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1228424623,"summarization_PnSummary_rougeL_recall":0.3750771332,"summarization_PnSummary_rougeL_f1_score":0.1793201723},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.079257203,"translation-fa2ar_fa2ar_nahj_bleu":0.0338415847,"translation-fa2ar_fa2ar_sahife_bleu":0.0570744002,"translation-fa2ar_fa2ar_quran_bleu":0.146855624},"nlg_score":0.178231145}
         | 
| 9 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1693490122,"question-generation_PersianQA_rougeL_recall":0.3886090827,"question-generation_PersianQA_rougeL_f1_score":0.227277052},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1799534349,"translation-en2fa_en2fa_epoque_bleu":0.4004213933,"translation-en2fa_en2fa_mizan_bleu":0.1703393716,"translation-en2fa_en2fa_quran_bleu":0.1225698669,"translation-en2fa_en2fa_sahife_bleu":0.0832764011,"translation-en2fa_en2fa_nahj_bleu":0.0439108113,"translation-en2fa_en2fa_tep_bleu":0.0595417592},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1538512444,"summarization_SamSUM-fa_rougeL_recall":0.3849531288,"summarization_SamSUM-fa_rougeL_f1_score":0.2115502707},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2247897554,"translation-fa2en_fa2en_tep_bleu":0.1341840946,"translation-fa2en_fa2en_mizan_bleu":0.1909021288,"translation-fa2en_fa2en_quran_bleu":0.1740971535,"translation-fa2en_fa2en_epoque_bleu":0.4544315204,"translation-fa2en_fa2en_nahj_bleu":0.0877235615,"translation-fa2en_fa2en_sahife_bleu":0.0975791022},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1471879954,"translation-ar2fa_ar2fa_sahife_bleu":0.1294214814,"translation-ar2fa_ar2fa_nahj_bleu":0.0642841927,"translation-ar2fa_ar2fa_quran_bleu":0.2437131219},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1188323392,"summarization_PnSummary_rougeL_recall":0.3948447809,"summarization_PnSummary_rougeL_f1_score":0.1786530476},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0761269879,"translation-fa2ar_fa2ar_nahj_bleu":0.0321440801,"translation-fa2ar_fa2ar_sahife_bleu":0.0613632957,"translation-fa2ar_fa2ar_quran_bleu":0.134873588},"nlg_score":0.1779340777}
         | 
|  | |
| 11 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https_google.com","parameters_count":"32800000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2281053588,"question-generation_PersianQA_rougeL_recall":0.370933314,"question-generation_PersianQA_rougeL_f1_score":0.273363418},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1623218856,"translation-en2fa_en2fa_epoque_bleu":0.3677879105,"translation-en2fa_en2fa_mizan_bleu":0.147599732,"translation-en2fa_en2fa_quran_bleu":0.0938457658,"translation-en2fa_en2fa_sahife_bleu":0.0698903005,"translation-en2fa_en2fa_nahj_bleu":0.0435129812,"translation-en2fa_en2fa_tep_bleu":0.0620337306},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1514618398,"summarization_SamSUM-fa_rougeL_recall":0.3683020708,"summarization_SamSUM-fa_rougeL_f1_score":0.2063212948},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.217991447,"translation-fa2en_fa2en_tep_bleu":0.1271542443,"translation-fa2en_fa2en_mizan_bleu":0.1728081337,"translation-fa2en_fa2en_quran_bleu":0.158860515,"translation-fa2en_fa2en_epoque_bleu":0.4572670962,"translation-fa2en_fa2en_nahj_bleu":0.0902445729,"translation-fa2en_fa2en_sahife_bleu":0.0945000287},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0985860814,"translation-ar2fa_ar2fa_sahife_bleu":0.0857687109,"translation-ar2fa_ar2fa_nahj_bleu":0.0622600203,"translation-ar2fa_ar2fa_quran_bleu":0.1459132099},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1089978489,"summarization_PnSummary_rougeL_recall":0.3936021933,"summarization_PnSummary_rougeL_f1_score":0.1662525669},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0507003531,"translation-fa2ar_fa2ar_nahj_bleu":0.0316047659,"translation-fa2ar_fa2ar_sahife_bleu":0.0534488007,"translation-fa2ar_fa2ar_quran_bleu":0.0670474926},"nlg_score":0.1679338638}
         | 
| 12 | 
             
            {"Model Name":"gpt-4.1-nano","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1622159789,"question-generation_PersianQA_rougeL_recall":0.302597472,"question-generation_PersianQA_rougeL_f1_score":0.2021048057},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1831593088,"translation-en2fa_en2fa_epoque_bleu":0.4052150706,"translation-en2fa_en2fa_mizan_bleu":0.1692823494,"translation-en2fa_en2fa_quran_bleu":0.1400476579,"translation-en2fa_en2fa_sahife_bleu":0.0812805634,"translation-en2fa_en2fa_nahj_bleu":0.048146149,"translation-en2fa_en2fa_tep_bleu":0.0610881446},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.16175156,"summarization_SamSUM-fa_rougeL_recall":0.3477483743,"summarization_SamSUM-fa_rougeL_f1_score":0.209834706},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2165819036,"translation-fa2en_fa2en_tep_bleu":0.13491043,"translation-fa2en_fa2en_mizan_bleu":0.1810957829,"translation-fa2en_fa2en_quran_bleu":0.164168601,"translation-fa2en_fa2en_epoque_bleu":0.4383628208,"translation-fa2en_fa2en_nahj_bleu":0.0942939662,"translation-fa2en_fa2en_sahife_bleu":0.0827637394},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1315367808,"translation-ar2fa_ar2fa_sahife_bleu":0.1063921688,"translation-ar2fa_ar2fa_nahj_bleu":0.0642188893,"translation-ar2fa_ar2fa_quran_bleu":0.2206333896},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1120916238,"summarization_PnSummary_rougeL_recall":0.3610411286,"summarization_PnSummary_rougeL_f1_score":0.1660826543},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0568324844,"translation-fa2ar_fa2ar_nahj_bleu":0.03267488,"translation-fa2ar_fa2ar_sahife_bleu":0.0579381183,"translation-fa2ar_fa2ar_quran_bleu":0.0798844549},"nlg_score":0.1665903777}
         | 
| 13 | 
             
            {"Model Name":"gemini-2.0-flash-lite","thinking_method":"β","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2782492277,"question-generation_PersianQA_rougeL_recall":0.3823213358,"question-generation_PersianQA_rougeL_f1_score":0.3109786075},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1750457687,"translation-en2fa_en2fa_epoque_bleu":0.3740903807,"translation-en2fa_en2fa_mizan_bleu":0.1593083308,"translation-en2fa_en2fa_quran_bleu":0.1325582833,"translation-en2fa_en2fa_sahife_bleu":0.1002994879,"translation-en2fa_en2fa_nahj_bleu":0.0501235873,"translation-en2fa_en2fa_tep_bleu":0.0652393013},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1810410242,"summarization_SamSUM-fa_rougeL_recall":0.4016180552,"summarization_SamSUM-fa_rougeL_f1_score":0.2380560527},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.0858473556,"translation-fa2en_fa2en_tep_bleu":0.0381837678,"translation-fa2en_fa2en_mizan_bleu":0.0750320212,"translation-fa2en_fa2en_quran_bleu":0.0986486354,"translation-fa2en_fa2en_epoque_bleu":0.1513689047,"translation-fa2en_fa2en_nahj_bleu":0.0568182224,"translation-fa2en_fa2en_sahife_bleu":0.0570620784},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1430472928,"translation-ar2fa_ar2fa_sahife_bleu":0.1326018858,"translation-ar2fa_ar2fa_nahj_bleu":0.0532180128,"translation-ar2fa_ar2fa_quran_bleu":0.2388305158},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1191404443,"summarization_PnSummary_rougeL_recall":0.365434541,"summarization_PnSummary_rougeL_f1_score":0.1744092468},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0341529902,"translation-fa2ar_fa2ar_nahj_bleu":0.0198079243,"translation-fa2ar_fa2ar_sahife_bleu":0.041930434,"translation-fa2ar_fa2ar_quran_bleu":0.0407206123},"nlg_score":0.1659339021}
         | 
| 14 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2221178335,"question-generation_PersianQA_rougeL_recall":0.335306645,"question-generation_PersianQA_rougeL_f1_score":0.2552875817},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1700971031,"translation-en2fa_en2fa_epoque_bleu":0.3619925896,"translation-en2fa_en2fa_mizan_bleu":0.1638764762,"translation-en2fa_en2fa_quran_bleu":0.1169026899,"translation-en2fa_en2fa_sahife_bleu":0.0785107337,"translation-en2fa_en2fa_nahj_bleu":0.0463016599,"translation-en2fa_en2fa_tep_bleu":0.0704424388},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1387162197,"summarization_SamSUM-fa_rougeL_recall":0.3472256524,"summarization_SamSUM-fa_rougeL_f1_score":0.1899415698},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2293783795,"translation-fa2en_fa2en_tep_bleu":0.1348246647,"translation-fa2en_fa2en_mizan_bleu":0.1880942935,"translation-fa2en_fa2en_quran_bleu":0.1642751236,"translation-fa2en_fa2en_epoque_bleu":0.4821448205,"translation-fa2en_fa2en_nahj_bleu":0.0857659109,"translation-fa2en_fa2en_sahife_bleu":0.0914041173},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1183647194,"translation-ar2fa_ar2fa_sahife_bleu":0.0905358622,"translation-ar2fa_ar2fa_nahj_bleu":0.0522591914,"translation-ar2fa_ar2fa_quran_bleu":0.2089938281},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.0830986853,"summarization_PnSummary_rougeL_recall":0.3565850313,"summarization_PnSummary_rougeL_f1_score":0.1308633101},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0564204856,"translation-fa2ar_fa2ar_nahj_bleu":0.0345882932,"translation-fa2ar_fa2ar_sahife_bleu":0.0554604649,"translation-fa2ar_fa2ar_quran_bleu":0.0792126988},"nlg_score":0.1643361642}
         | 
| 15 | 
             
            {"Model Name":"c4ai-command-r-v01","thinking_method":"β","model_url":"https_google.com","parameters_count":"35000000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1546246184,"question-generation_PersianQA_rougeL_recall":0.253394795,"question-generation_PersianQA_rougeL_f1_score":0.1829113647},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1506934102,"translation-en2fa_en2fa_epoque_bleu":0.2951032905,"translation-en2fa_en2fa_mizan_bleu":0.1500681264,"translation-en2fa_en2fa_quran_bleu":0.1104277702,"translation-en2fa_en2fa_sahife_bleu":0.092222972,"translation-en2fa_en2fa_nahj_bleu":0.0497623005,"translation-en2fa_en2fa_tep_bleu":0.0692905167},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1944265929,"summarization_SamSUM-fa_rougeL_recall":0.3761499249,"summarization_SamSUM-fa_rougeL_f1_score":0.242617187},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.1892370035,"translation-fa2en_fa2en_tep_bleu":0.1290684643,"translation-fa2en_fa2en_mizan_bleu":0.1721408901,"translation-fa2en_fa2en_quran_bleu":0.1736791408,"translation-fa2en_fa2en_epoque_bleu":0.346100597,"translation-fa2en_fa2en_nahj_bleu":0.0776400174,"translation-fa2en_fa2en_sahife_bleu":0.08279759},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.1144863268,"translation-ar2fa_ar2fa_sahife_bleu":0.1190971594,"translation-ar2fa_ar2fa_nahj_bleu":0.0648109303,"translation-ar2fa_ar2fa_quran_bleu":0.157067121},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1298447221,"summarization_PnSummary_rougeL_recall":0.3548911672,"summarization_PnSummary_rougeL_f1_score":0.1841564462},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0852951832,"translation-fa2ar_fa2ar_nahj_bleu":0.0464072569,"translation-fa2ar_fa2ar_sahife_bleu":0.0713426227,"translation-fa2ar_fa2ar_quran_bleu":0.1381356701},"nlg_score":0.1641995602}
         | 
| 16 | 
             
            {"Model Name":"Qwen3-30B-A3B","thinking_method":"β","model_url":"https_google.com","parameters_count":"30500000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1996840686,"question-generation_PersianQA_rougeL_recall":0.3393114266,"question-generation_PersianQA_rougeL_f1_score":0.2417040176},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1617787549,"translation-en2fa_en2fa_epoque_bleu":0.3821529147,"translation-en2fa_en2fa_mizan_bleu":0.1337537913,"translation-en2fa_en2fa_quran_bleu":0.0860909143,"translation-en2fa_en2fa_sahife_bleu":0.0770506908,"translation-en2fa_en2fa_nahj_bleu":0.0441728515,"translation-en2fa_en2fa_tep_bleu":0.0587014819},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1523824175,"summarization_SamSUM-fa_rougeL_recall":0.3838683519,"summarization_SamSUM-fa_rougeL_f1_score":0.2083553767},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2177785793,"translation-fa2en_fa2en_tep_bleu":0.1189948472,"translation-fa2en_fa2en_mizan_bleu":0.1793626928,"translation-fa2en_fa2en_quran_bleu":0.1718006478,"translation-fa2en_fa2en_epoque_bleu":0.4500382308,"translation-fa2en_fa2en_nahj_bleu":0.0836776138,"translation-fa2en_fa2en_sahife_bleu":0.1034067477},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.090408759,"translation-ar2fa_ar2fa_sahife_bleu":0.0778953352,"translation-ar2fa_ar2fa_nahj_bleu":0.0610049198,"translation-ar2fa_ar2fa_quran_bleu":0.13085583},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1212751301,"summarization_PnSummary_rougeL_recall":0.3923323141,"summarization_PnSummary_rougeL_f1_score":0.1804727387},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0483297895,"translation-fa2ar_fa2ar_nahj_bleu":0.0310247441,"translation-fa2ar_fa2ar_sahife_bleu":0.0512375201,"translation-fa2ar_fa2ar_quran_bleu":0.0627271043},"nlg_score":0.164118288}
         | 
| 17 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https_google.com","parameters_count":"14800000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1987198912,"question-generation_PersianQA_rougeL_recall":0.3431437262,"question-generation_PersianQA_rougeL_f1_score":0.2419384398},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1535253787,"translation-en2fa_en2fa_epoque_bleu":0.3553678809,"translation-en2fa_en2fa_mizan_bleu":0.1285441922,"translation-en2fa_en2fa_quran_bleu":0.0857809616,"translation-en2fa_en2fa_sahife_bleu":0.0787025343,"translation-en2fa_en2fa_nahj_bleu":0.0404850935,"translation-en2fa_en2fa_tep_bleu":0.0586129062},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1469468837,"summarization_SamSUM-fa_rougeL_recall":0.3743807014,"summarization_SamSUM-fa_rougeL_f1_score":0.2022859929},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2145488085,"translation-fa2en_fa2en_tep_bleu":0.1307272464,"translation-fa2en_fa2en_mizan_bleu":0.1697754862,"translation-fa2en_fa2en_quran_bleu":0.1552415558,"translation-fa2en_fa2en_epoque_bleu":0.4513682579,"translation-fa2en_fa2en_nahj_bleu":0.0842673472,"translation-fa2en_fa2en_sahife_bleu":0.0853787118},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0910450298,"translation-ar2fa_ar2fa_sahife_bleu":0.0862679894,"translation-ar2fa_ar2fa_nahj_bleu":0.0558129824,"translation-ar2fa_ar2fa_quran_bleu":0.1292925153},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1123870374,"summarization_PnSummary_rougeL_recall":0.4032007327,"summarization_PnSummary_rougeL_f1_score":0.17115848},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0494411806,"translation-fa2ar_fa2ar_nahj_bleu":0.0369805868,"translation-fa2ar_fa2ar_sahife_bleu":0.0567654991,"translation-fa2ar_fa2ar_quran_bleu":0.0545774559},"nlg_score":0.16056333}
         | 
| 18 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https_google.com","parameters_count":"109000000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1572445395,"question-generation_PersianQA_rougeL_recall":0.2651515671,"question-generation_PersianQA_rougeL_f1_score":0.1889377754},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1694667296,"translation-en2fa_en2fa_epoque_bleu":0.3980975238,"translation-en2fa_en2fa_mizan_bleu":0.1400810731,"translation-en2fa_en2fa_quran_bleu":0.1173019123,"translation-en2fa_en2fa_sahife_bleu":0.0758825134,"translation-en2fa_en2fa_nahj_bleu":0.0380397952,"translation-en2fa_en2fa_tep_bleu":0.05711699},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1539866165,"summarization_SamSUM-fa_rougeL_recall":0.341409574,"summarization_SamSUM-fa_rougeL_f1_score":0.2007085976},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.1909462413,"translation-fa2en_fa2en_tep_bleu":0.1038996524,"translation-fa2en_fa2en_mizan_bleu":0.1513900262,"translation-fa2en_fa2en_quran_bleu":0.129609905,"translation-fa2en_fa2en_epoque_bleu":0.4266734606,"translation-fa2en_fa2en_nahj_bleu":0.0619630431,"translation-fa2en_fa2en_sahife_bleu":0.0584029483},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0997661237,"translation-ar2fa_ar2fa_sahife_bleu":0.0880416079,"translation-ar2fa_ar2fa_nahj_bleu":0.0425251453,"translation-ar2fa_ar2fa_quran_bleu":0.165869569},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1377053282,"summarization_PnSummary_rougeL_recall":0.380073051,"summarization_PnSummary_rougeL_f1_score":0.1928750247},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0548753777,"translation-fa2ar_fa2ar_nahj_bleu":0.0318327001,"translation-fa2ar_fa2ar_sahife_bleu":0.0567893259,"translation-fa2ar_fa2ar_quran_bleu":0.076004107},"nlg_score":0.1567965528}
         | 
| 19 | 
             
            {"Model Name":"Qwen3-8B","thinking_method":"β","model_url":"https_google.com","parameters_count":"8190000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1965366702,"question-generation_PersianQA_rougeL_recall":0.340760284,"question-generation_PersianQA_rougeL_f1_score":0.2388923895},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1550276898,"translation-en2fa_en2fa_epoque_bleu":0.3721582216,"translation-en2fa_en2fa_mizan_bleu":0.1231599039,"translation-en2fa_en2fa_quran_bleu":0.0882213453,"translation-en2fa_en2fa_sahife_bleu":0.0725213197,"translation-en2fa_en2fa_nahj_bleu":0.0424186358,"translation-en2fa_en2fa_tep_bleu":0.0528718634},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1463365551,"summarization_SamSUM-fa_rougeL_recall":0.3856017289,"summarization_SamSUM-fa_rougeL_f1_score":0.2024070197},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.2024225184,"translation-fa2en_fa2en_tep_bleu":0.1163127945,"translation-fa2en_fa2en_mizan_bleu":0.1649009947,"translation-fa2en_fa2en_quran_bleu":0.1513328968,"translation-fa2en_fa2en_epoque_bleu":0.4171232399,"translation-fa2en_fa2en_nahj_bleu":0.0857999462,"translation-fa2en_fa2en_sahife_bleu":0.0929479364},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0821020713,"translation-ar2fa_ar2fa_sahife_bleu":0.0730469461,"translation-ar2fa_ar2fa_nahj_bleu":0.0579031327,"translation-ar2fa_ar2fa_quran_bleu":0.1141461882},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.109255822,"summarization_PnSummary_rougeL_recall":0.3979273385,"summarization_PnSummary_rougeL_f1_score":0.1669061111},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0423318046,"translation-fa2ar_fa2ar_nahj_bleu":0.0329089717,"translation-fa2ar_fa2ar_sahife_bleu":0.0445101244,"translation-fa2ar_fa2ar_quran_bleu":0.0495763178},"nlg_score":0.1557270864}
         | 
| 20 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2002927511,"question-generation_PersianQA_rougeL_recall":0.3328639596,"question-generation_PersianQA_rougeL_f1_score":0.2391789869},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1608795131,"translation-en2fa_en2fa_epoque_bleu":0.3578688062,"translation-en2fa_en2fa_mizan_bleu":0.1485917499,"translation-en2fa_en2fa_quran_bleu":0.094218512,"translation-en2fa_en2fa_sahife_bleu":0.0778161632,"translation-en2fa_en2fa_nahj_bleu":0.0434765061,"translation-en2fa_en2fa_tep_bleu":0.0618688381},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1158613629,"summarization_SamSUM-fa_rougeL_recall":0.3578031642,"summarization_SamSUM-fa_rougeL_f1_score":0.168058919},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.1889897396,"translation-fa2en_fa2en_tep_bleu":0.1330232097,"translation-fa2en_fa2en_mizan_bleu":0.1552418193,"translation-fa2en_fa2en_quran_bleu":0.1151586178,"translation-fa2en_fa2en_epoque_bleu":0.3895907069,"translation-fa2en_fa2en_nahj_bleu":0.0701778462,"translation-fa2en_fa2en_sahife_bleu":0.0722357071},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0975905866,"translation-ar2fa_ar2fa_sahife_bleu":0.0824300354,"translation-ar2fa_ar2fa_nahj_bleu":0.0513812903,"translation-ar2fa_ar2fa_quran_bleu":0.1566499693},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.0783955467,"summarization_PnSummary_rougeL_recall":0.3671775126,"summarization_PnSummary_rougeL_f1_score":0.1256898612},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0374749811,"translation-fa2ar_fa2ar_nahj_bleu":0.0275129836,"translation-fa2ar_fa2ar_sahife_bleu":0.0412173132,"translation-fa2ar_fa2ar_quran_bleu":0.0436946465},"nlg_score":0.1454089411}
         | 
| 21 | 
             
            {"Model Name":"Qwen3-4B","thinking_method":"β","model_url":"https_google.com","parameters_count":"4020000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1744197112,"question-generation_PersianQA_rougeL_recall":0.2697024508,"question-generation_PersianQA_rougeL_f1_score":0.2017710943},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1217211215,"translation-en2fa_en2fa_epoque_bleu":0.2916268514,"translation-en2fa_en2fa_mizan_bleu":0.091925603,"translation-en2fa_en2fa_quran_bleu":0.065498518,"translation-en2fa_en2fa_sahife_bleu":0.0612237455,"translation-en2fa_en2fa_nahj_bleu":0.0385824628,"translation-en2fa_en2fa_tep_bleu":0.0453883692},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1429609514,"summarization_SamSUM-fa_rougeL_recall":0.397717388,"summarization_SamSUM-fa_rougeL_f1_score":0.2013136641},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.1840809218,"translation-fa2en_fa2en_tep_bleu":0.1011436783,"translation-fa2en_fa2en_mizan_bleu":0.149157222,"translation-fa2en_fa2en_quran_bleu":0.1377761662,"translation-fa2en_fa2en_epoque_bleu":0.3802946233,"translation-fa2en_fa2en_nahj_bleu":0.0851756367,"translation-fa2en_fa2en_sahife_bleu":0.0857201524},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0636385541,"translation-ar2fa_ar2fa_sahife_bleu":0.0557180428,"translation-ar2fa_ar2fa_nahj_bleu":0.0539968488,"translation-ar2fa_ar2fa_quran_bleu":0.0807186853},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1067208324,"summarization_PnSummary_rougeL_recall":0.4109136551,"summarization_PnSummary_rougeL_f1_score":0.1648475797},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0351351131,"translation-fa2ar_fa2ar_nahj_bleu":0.0313503027,"translation-fa2ar_fa2ar_sahife_bleu":0.042075565,"translation-fa2ar_fa2ar_quran_bleu":0.0319794715},"nlg_score":0.1389297212}
         | 
| 22 | 
             
            {"Model Name":"gemini-2.5-flash","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"N\/A","source_type":"Closed-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.3121385499,"question-generation_PersianQA_rougeL_recall":0.4162991047,"question-generation_PersianQA_rougeL_f1_score":0.3445136596},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.0650794176,"translation-en2fa_en2fa_epoque_bleu":0.1194375779,"translation-en2fa_en2fa_mizan_bleu":0.0640649978,"translation-en2fa_en2fa_quran_bleu":0.0926514743,"translation-en2fa_en2fa_sahife_bleu":0.0392464347,"translation-en2fa_en2fa_nahj_bleu":0.022322883,"translation-en2fa_en2fa_tep_bleu":0.0184227674},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1525978605,"summarization_SamSUM-fa_rougeL_recall":0.3945587249,"summarization_SamSUM-fa_rougeL_f1_score":0.209852471},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.0559484689,"translation-fa2en_fa2en_tep_bleu":0.0190401646,"translation-fa2en_fa2en_mizan_bleu":0.0369126121,"translation-fa2en_fa2en_quran_bleu":0.0401048971,"translation-fa2en_fa2en_epoque_bleu":0.1381975553,"translation-fa2en_fa2en_nahj_bleu":0.0232788817,"translation-fa2en_fa2en_sahife_bleu":0.017477039},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0772188097,"translation-ar2fa_ar2fa_sahife_bleu":0.0610321929,"translation-ar2fa_ar2fa_nahj_bleu":0.0273061824,"translation-ar2fa_ar2fa_quran_bleu":0.1408224224},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1070140366,"summarization_PnSummary_rougeL_recall":0.4357356292,"summarization_PnSummary_rougeL_f1_score":0.1672508999},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0382543341,"translation-fa2ar_fa2ar_nahj_bleu":0.032191006,"translation-fa2ar_fa2ar_sahife_bleu":0.028980881,"translation-fa2ar_fa2ar_quran_bleu":0.0535911152},"nlg_score":0.1368740087}
         | 
| 23 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https_google.com","parameters_count":"20000000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1877254615,"question-generation_PersianQA_rougeL_recall":0.3036923298,"question-generation_PersianQA_rougeL_f1_score":0.2215402117},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1482164359,"translation-en2fa_en2fa_epoque_bleu":0.3332313032,"translation-en2fa_en2fa_mizan_bleu":0.1348649993,"translation-en2fa_en2fa_quran_bleu":0.0798910499,"translation-en2fa_en2fa_sahife_bleu":0.0724923326,"translation-en2fa_en2fa_nahj_bleu":0.0425031053,"translation-en2fa_en2fa_tep_bleu":0.0570157331},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1076131004,"summarization_SamSUM-fa_rougeL_recall":0.354952604,"summarization_SamSUM-fa_rougeL_f1_score":0.1578241504},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.1811060704,"translation-fa2en_fa2en_tep_bleu":0.1180786789,"translation-fa2en_fa2en_mizan_bleu":0.1503794353,"translation-fa2en_fa2en_quran_bleu":0.1042682142,"translation-fa2en_fa2en_epoque_bleu":0.3794274854,"translation-fa2en_fa2en_nahj_bleu":0.0641545233,"translation-fa2en_fa2en_sahife_bleu":0.0772362522},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0704966071,"translation-ar2fa_ar2fa_sahife_bleu":0.0675578984,"translation-ar2fa_ar2fa_nahj_bleu":0.042116411,"translation-ar2fa_ar2fa_quran_bleu":0.1003965021},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.0796516779,"summarization_PnSummary_rougeL_recall":0.3573917363,"summarization_PnSummary_rougeL_f1_score":0.1263677591},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0287298887,"translation-fa2ar_fa2ar_nahj_bleu":0.025061663,"translation-fa2ar_fa2ar_sahife_bleu":0.0355711393,"translation-fa2ar_fa2ar_quran_bleu":0.0255568639},"nlg_score":0.1334687319}
         | 
| 24 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https_google.com","parameters_count":"24000000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.1520819517,"question-generation_PersianQA_rougeL_recall":0.26324767,"question-generation_PersianQA_rougeL_f1_score":0.1843401988},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.1458447378,"translation-en2fa_en2fa_epoque_bleu":0.3541508677,"translation-en2fa_en2fa_mizan_bleu":0.1259468635,"translation-en2fa_en2fa_quran_bleu":0.0887225632,"translation-en2fa_en2fa_sahife_bleu":0.0672732746,"translation-en2fa_en2fa_nahj_bleu":0.0407327793,"translation-en2fa_en2fa_tep_bleu":0.0293172873},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.147286408,"summarization_SamSUM-fa_rougeL_recall":0.4066657958,"summarization_SamSUM-fa_rougeL_f1_score":0.2072278176},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.1451163884,"translation-fa2en_fa2en_tep_bleu":0.0393307601,"translation-fa2en_fa2en_mizan_bleu":0.1009347025,"translation-fa2en_fa2en_quran_bleu":0.0929688918,"translation-fa2en_fa2en_epoque_bleu":0.3660914464,"translation-fa2en_fa2en_nahj_bleu":0.0536507876,"translation-fa2en_fa2en_sahife_bleu":0.05038339},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0594554675,"translation-ar2fa_ar2fa_sahife_bleu":0.0539986603,"translation-ar2fa_ar2fa_nahj_bleu":0.035240584,"translation-ar2fa_ar2fa_quran_bleu":0.0879164142},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1029257145,"summarization_PnSummary_rougeL_recall":0.4347811424,"summarization_PnSummary_rougeL_f1_score":0.1621438757},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0192357288,"translation-fa2ar_fa2ar_nahj_bleu":0.0151369319,"translation-fa2ar_fa2ar_sahife_bleu":0.0245784397,"translation-fa2ar_fa2ar_quran_bleu":0.0179918148},"nlg_score":0.1319091735}
         | 
| 25 | 
             
            {"Model Name":"gemma-3-12b-it","thinking_method":"β","model_url":"https_google.com","parameters_count":"12200000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.2572991833,"question-generation_PersianQA_rougeL_recall":0.3740225235,"question-generation_PersianQA_rougeL_f1_score":0.2927586837},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.08817485,"translation-en2fa_en2fa_epoque_bleu":0.1886801725,"translation-en2fa_en2fa_mizan_bleu":0.0879987558,"translation-en2fa_en2fa_quran_bleu":0.0657922023,"translation-en2fa_en2fa_sahife_bleu":0.0296141618,"translation-en2fa_en2fa_nahj_bleu":0.0192266597,"translation-en2fa_en2fa_tep_bleu":0.0366296874},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1658145118,"summarization_SamSUM-fa_rougeL_recall":0.3677760479,"summarization_SamSUM-fa_rougeL_f1_score":0.2189237562},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.0257184881,"translation-fa2en_fa2en_tep_bleu":0.011593122,"translation-fa2en_fa2en_mizan_bleu":0.0215328963,"translation-fa2en_fa2en_quran_bleu":0.0262056878,"translation-fa2en_fa2en_epoque_bleu":0.047221295,"translation-fa2en_fa2en_nahj_bleu":0.0178557856,"translation-fa2en_fa2en_sahife_bleu":0.0169922826},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.032619077,"translation-ar2fa_ar2fa_sahife_bleu":0.0333185867,"translation-ar2fa_ar2fa_nahj_bleu":0.0106299838,"translation-ar2fa_ar2fa_quran_bleu":0.0528092057},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1156871575,"summarization_PnSummary_rougeL_recall":0.3630716995,"summarization_PnSummary_rougeL_f1_score":0.1697348346},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0098333287,"translation-fa2ar_fa2ar_nahj_bleu":0.0072190824,"translation-fa2ar_fa2ar_sahife_bleu":0.0110570977,"translation-fa2ar_fa2ar_quran_bleu":0.0112238061},"nlg_score":0.1196804312}
         | 
| 26 | 
             
            {"Model Name":"aya-expanse-32b","thinking_method":"β","model_url":"https_google.com","parameters_count":"32300000000","source_type":"Open-Source","question-generation_PersianQA":{"question-generation_PersianQA_rougeL_precision":0.0980160864,"question-generation_PersianQA_rougeL_recall":0.347983913,"question-generation_PersianQA_rougeL_f1_score":0.1443872083},"translation-en2fa_en2fa":{"translation-en2fa_en2fa_bleu":0.0951102411,"translation-en2fa_en2fa_epoque_bleu":0.2204131973,"translation-en2fa_en2fa_mizan_bleu":0.0772021612,"translation-en2fa_en2fa_quran_bleu":0.0914129011,"translation-en2fa_en2fa_sahife_bleu":0.0555605793,"translation-en2fa_en2fa_nahj_bleu":0.0296371925,"translation-en2fa_en2fa_tep_bleu":0.0145962694},"summarization_SamSUM-fa":{"summarization_SamSUM-fa_rougeL_precision":0.1338082958,"summarization_SamSUM-fa_rougeL_recall":0.397938928,"summarization_SamSUM-fa_rougeL_f1_score":0.1933390916},"translation-fa2en_fa2en":{"translation-fa2en_fa2en_bleu":0.14443262,"translation-fa2en_fa2en_tep_bleu":0.0636878051,"translation-fa2en_fa2en_mizan_bleu":0.1045784226,"translation-fa2en_fa2en_quran_bleu":0.1065169191,"translation-fa2en_fa2en_epoque_bleu":0.3331896819,"translation-fa2en_fa2en_nahj_bleu":0.0573420672,"translation-fa2en_fa2en_sahife_bleu":0.0526154809},"translation-ar2fa_ar2fa":{"translation-ar2fa_ar2fa_bleu":0.0608470749,"translation-ar2fa_ar2fa_sahife_bleu":0.0636783644,"translation-ar2fa_ar2fa_nahj_bleu":0.0258604511,"translation-ar2fa_ar2fa_quran_bleu":0.091253078},"summarization_PnSummary":{"summarization_PnSummary_rougeL_precision":0.1094933227,"summarization_PnSummary_rougeL_recall":0.3979476995,"summarization_PnSummary_rougeL_f1_score":0.1674664883},"translation-fa2ar_fa2ar":{"translation-fa2ar_fa2ar_bleu":0.0318976507,"translation-fa2ar_fa2ar_nahj_bleu":0.0222927973,"translation-fa2ar_fa2ar_sahife_bleu":0.0296757253,"translation-fa2ar_fa2ar_quran_bleu":0.0437244293},"nlg_score":0.1196400535}
         | 
    	
        leaderboard/boards_data/persian_nlu.jsonl
    CHANGED
    
    | The diff for this file is too large to render. 
		See raw diff | 
|  | 
    	
        leaderboard/boards_data/question-generation_PersianQA.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","question-generation_PersianQA_rougeL_precision":0.1693490122,"question-generation_PersianQA_rougeL_recall":0.3886090827,"question-generation_PersianQA_rougeL_f1_score":0.227277052,"nlg_score":0.1779340777}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1704020873,"question-generation_PersianQA_rougeL_recall":0.3000756202,"question-generation_PersianQA_rougeL_f1_score":0.2079039891,"nlg_score":0.0949943578}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.2149535143,"question-generation_PersianQA_rougeL_recall":0.3019561885,"question-generation_PersianQA_rougeL_f1_score":0.2405115465,"nlg_score":0.1880477876}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1365997259,"question-generation_PersianQA_rougeL_recall":0.3257934111,"question-generation_PersianQA_rougeL_f1_score":0.1803398036,"nlg_score":0.0940241349}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","question-generation_PersianQA_rougeL_precision":0.2576021626,"question-generation_PersianQA_rougeL_recall":0.3924501003,"question-generation_PersianQA_rougeL_f1_score":0.2985826349,"nlg_score":0.194675133}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","question-generation_PersianQA_rougeL_precision":null,"question-generation_PersianQA_rougeL_recall":null,"question-generation_PersianQA_rougeL_f1_score":null,"nlg_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.2041596361,"question-generation_PersianQA_rougeL_recall":0.3456815337,"question-generation_PersianQA_rougeL_f1_score":0.2459732807,"nlg_score":0.1067134448}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1987198912,"question-generation_PersianQA_rougeL_recall":0.3431437262,"question-generation_PersianQA_rougeL_f1_score":0.2419384398,"nlg_score":0.16056333}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.2281053588,"question-generation_PersianQA_rougeL_recall":0.370933314,"question-generation_PersianQA_rougeL_f1_score":0.273363418,"nlg_score":0.1679338638}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","question-generation_PersianQA_rougeL_precision":0.0870939736,"question-generation_PersianQA_rougeL_recall":0.3600941065,"question-generation_PersianQA_rougeL_f1_score":0.1336375958,"nlg_score":0.1089333827}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1520819517,"question-generation_PersianQA_rougeL_recall":0.26324767,"question-generation_PersianQA_rougeL_f1_score":0.1843401988,"nlg_score":0.1319091735}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1669255457,"question-generation_PersianQA_rougeL_recall":0.2952488346,"question-generation_PersianQA_rougeL_f1_score":0.2007786564,"nlg_score":0.112015688}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","question-generation_PersianQA_rougeL_precision":0.1693490122,"question-generation_PersianQA_rougeL_recall":0.3886090827,"question-generation_PersianQA_rougeL_f1_score":0.227277052,"nlg_score":0.1779340777}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1877254615,"question-generation_PersianQA_rougeL_recall":0.3036923298,"question-generation_PersianQA_rougeL_f1_score":0.2215402117,"nlg_score":0.1334687319}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1704020873,"question-generation_PersianQA_rougeL_recall":0.3000756202,"question-generation_PersianQA_rougeL_f1_score":0.2079039891,"nlg_score":0.0949943578}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.2149535143,"question-generation_PersianQA_rougeL_recall":0.3019561885,"question-generation_PersianQA_rougeL_f1_score":0.2405115465,"nlg_score":0.1880477876}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","question-generation_PersianQA_rougeL_precision":0.2602516122,"question-generation_PersianQA_rougeL_recall":0.3803807526,"question-generation_PersianQA_rougeL_f1_score":0.2967852302,"nlg_score":0.181552926}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","question-generation_PersianQA_rougeL_precision":0.2221178335,"question-generation_PersianQA_rougeL_recall":0.335306645,"question-generation_PersianQA_rougeL_f1_score":0.2552875817,"nlg_score":0.1643361642}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.2002927511,"question-generation_PersianQA_rougeL_recall":0.3328639596,"question-generation_PersianQA_rougeL_f1_score":0.2391789869,"nlg_score":0.1454089411}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1365997259,"question-generation_PersianQA_rougeL_recall":0.3257934111,"question-generation_PersianQA_rougeL_f1_score":0.1803398036,"nlg_score":0.0940241349}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","question-generation_PersianQA_rougeL_precision":0.2576021626,"question-generation_PersianQA_rougeL_recall":0.3924501003,"question-generation_PersianQA_rougeL_f1_score":0.2985826349,"nlg_score":0.194675133}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","question-generation_PersianQA_rougeL_precision":null,"question-generation_PersianQA_rougeL_recall":null,"question-generation_PersianQA_rougeL_f1_score":null,"nlg_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.2041596361,"question-generation_PersianQA_rougeL_recall":0.3456815337,"question-generation_PersianQA_rougeL_f1_score":0.2459732807,"nlg_score":0.1067134448}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1987198912,"question-generation_PersianQA_rougeL_recall":0.3431437262,"question-generation_PersianQA_rougeL_f1_score":0.2419384398,"nlg_score":0.16056333}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.2281053588,"question-generation_PersianQA_rougeL_recall":0.370933314,"question-generation_PersianQA_rougeL_f1_score":0.273363418,"nlg_score":0.1679338638}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1572445395,"question-generation_PersianQA_rougeL_recall":0.2651515671,"question-generation_PersianQA_rougeL_f1_score":0.1889377754,"nlg_score":0.1567965528}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","question-generation_PersianQA_rougeL_precision":0.0870939736,"question-generation_PersianQA_rougeL_recall":0.3600941065,"question-generation_PersianQA_rougeL_f1_score":0.1336375958,"nlg_score":0.1089333827}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1520819517,"question-generation_PersianQA_rougeL_recall":0.26324767,"question-generation_PersianQA_rougeL_f1_score":0.1843401988,"nlg_score":0.1319091735}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","question-generation_PersianQA_rougeL_precision":0.1669255457,"question-generation_PersianQA_rougeL_recall":0.2952488346,"question-generation_PersianQA_rougeL_f1_score":0.2007786564,"nlg_score":0.112015688}
         | 
    	
        leaderboard/boards_data/sentiment-analysis_deepsentipers.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sentiment-analysis_deepsentipers_acc_modified":0.8058409951,"sentiment-analysis_deepsentipers_precision_modified":0.7717795715,"sentiment-analysis_deepsentipers_recall_modified":0.8211827366,"sentiment-analysis_deepsentipers_fscore_modified":0.7889064935,"sentiment-analysis_deepsentipers_acc":0.8062770563,"sentiment-analysis_deepsentipers_precision":0.7721972011,"sentiment-analysis_deepsentipers_recall":0.8216270995,"sentiment-analysis_deepsentipers_fscore":0.7893333909,"sentiment-analysis_deepsentipers_valid_output_ratio":0.9994591671,"nlu_score":0.7143086066}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.6817691478,"sentiment-analysis_deepsentipers_precision_modified":0.6546744642,"sentiment-analysis_deepsentipers_recall_modified":0.7378694789,"sentiment-analysis_deepsentipers_fscore_modified":0.6356142977,"sentiment-analysis_deepsentipers_acc":0.6817691478,"sentiment-analysis_deepsentipers_precision":0.6546744642,"sentiment-analysis_deepsentipers_recall":0.7378694789,"sentiment-analysis_deepsentipers_fscore":0.6356142977,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6241793507}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.738403452,"sentiment-analysis_deepsentipers_precision_modified":0.706763853,"sentiment-analysis_deepsentipers_recall_modified":0.7658510846,"sentiment-analysis_deepsentipers_fscore_modified":0.726373242,"sentiment-analysis_deepsentipers_acc":0.738403452,"sentiment-analysis_deepsentipers_precision":0.706763853,"sentiment-analysis_deepsentipers_recall":0.7658510846,"sentiment-analysis_deepsentipers_fscore":0.726373242,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7518878101,"sentiment-analysis_deepsentipers_precision_modified":0.7333601788,"sentiment-analysis_deepsentipers_recall_modified":0.7850018857,"sentiment-analysis_deepsentipers_fscore_modified":0.7214827861,"sentiment-analysis_deepsentipers_acc":0.752293578,"sentiment-analysis_deepsentipers_precision":0.7337559479,"sentiment-analysis_deepsentipers_recall":0.785425524,"sentiment-analysis_deepsentipers_fscore":0.7218721454,"sentiment-analysis_deepsentipers_valid_output_ratio":0.9994606257,"nlu_score":0.6552152029}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sentiment-analysis_deepsentipers_acc_modified":0.8047464941,"sentiment-analysis_deepsentipers_precision_modified":0.7661826532,"sentiment-analysis_deepsentipers_recall_modified":0.8089861144,"sentiment-analysis_deepsentipers_fscore_modified":0.7830417049,"sentiment-analysis_deepsentipers_acc":0.8047464941,"sentiment-analysis_deepsentipers_precision":0.7661826532,"sentiment-analysis_deepsentipers_recall":0.8089861144,"sentiment-analysis_deepsentipers_fscore":0.7830417049,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sentiment-analysis_deepsentipers_acc_modified":null,"sentiment-analysis_deepsentipers_precision_modified":null,"sentiment-analysis_deepsentipers_recall_modified":null,"sentiment-analysis_deepsentipers_fscore_modified":null,"sentiment-analysis_deepsentipers_acc":null,"sentiment-analysis_deepsentipers_precision":null,"sentiment-analysis_deepsentipers_recall":null,"sentiment-analysis_deepsentipers_fscore":null,"sentiment-analysis_deepsentipers_valid_output_ratio":null,"nlu_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7556634304,"sentiment-analysis_deepsentipers_precision_modified":0.7100962569,"sentiment-analysis_deepsentipers_recall_modified":0.796296032,"sentiment-analysis_deepsentipers_fscore_modified":0.7198160026,"sentiment-analysis_deepsentipers_acc":0.7556634304,"sentiment-analysis_deepsentipers_precision":0.7100962569,"sentiment-analysis_deepsentipers_recall":0.796296032,"sentiment-analysis_deepsentipers_fscore":0.7198160026,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7459546926,"sentiment-analysis_deepsentipers_precision_modified":0.696002467,"sentiment-analysis_deepsentipers_recall_modified":0.7725731976,"sentiment-analysis_deepsentipers_fscore_modified":0.7160207999,"sentiment-analysis_deepsentipers_acc":0.7459546926,"sentiment-analysis_deepsentipers_precision":0.696002467,"sentiment-analysis_deepsentipers_recall":0.7725731976,"sentiment-analysis_deepsentipers_fscore":0.7160207999,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7820927724,"sentiment-analysis_deepsentipers_precision_modified":0.7592820571,"sentiment-analysis_deepsentipers_recall_modified":0.7768252647,"sentiment-analysis_deepsentipers_fscore_modified":0.7562669975,"sentiment-analysis_deepsentipers_acc":0.7820927724,"sentiment-analysis_deepsentipers_precision":0.7592820571,"sentiment-analysis_deepsentipers_recall":0.7768252647,"sentiment-analysis_deepsentipers_fscore":0.7562669975,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sentiment-analysis_deepsentipers_acc_modified":0.7521691974,"sentiment-analysis_deepsentipers_precision_modified":0.7149147283,"sentiment-analysis_deepsentipers_recall_modified":0.7661218172,"sentiment-analysis_deepsentipers_fscore_modified":0.7340307684,"sentiment-analysis_deepsentipers_acc":0.7550353838,"sentiment-analysis_deepsentipers_precision":0.7176389542,"sentiment-analysis_deepsentipers_recall":0.7690411709,"sentiment-analysis_deepsentipers_fscore":0.7368278372,"sentiment-analysis_deepsentipers_valid_output_ratio":0.9962039046,"nlu_score":0.3749414991}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.5949298813,"sentiment-analysis_deepsentipers_precision_modified":0.6633283768,"sentiment-analysis_deepsentipers_recall_modified":0.6739827327,"sentiment-analysis_deepsentipers_fscore_modified":0.597099001,"sentiment-analysis_deepsentipers_acc":0.5958941113,"sentiment-analysis_deepsentipers_precision":0.6644034633,"sentiment-analysis_deepsentipers_recall":0.6750750872,"sentiment-analysis_deepsentipers_fscore":0.5980667466,"sentiment-analysis_deepsentipers_valid_output_ratio":0.998381877,"nlu_score":0.5661558794}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7038834951,"sentiment-analysis_deepsentipers_precision_modified":0.6558175114,"sentiment-analysis_deepsentipers_recall_modified":0.7195323034,"sentiment-analysis_deepsentipers_fscore_modified":0.6634075099,"sentiment-analysis_deepsentipers_acc":0.7038834951,"sentiment-analysis_deepsentipers_precision":0.6558175114,"sentiment-analysis_deepsentipers_recall":0.7195323034,"sentiment-analysis_deepsentipers_fscore":0.6634075099,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.456845738}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sentiment-analysis_deepsentipers_acc_modified":0.8058409951,"sentiment-analysis_deepsentipers_precision_modified":0.7717795715,"sentiment-analysis_deepsentipers_recall_modified":0.8211827366,"sentiment-analysis_deepsentipers_fscore_modified":0.7889064935,"sentiment-analysis_deepsentipers_acc":0.8062770563,"sentiment-analysis_deepsentipers_precision":0.7721972011,"sentiment-analysis_deepsentipers_recall":0.8216270995,"sentiment-analysis_deepsentipers_fscore":0.7893333909,"sentiment-analysis_deepsentipers_valid_output_ratio":0.9994591671,"nlu_score":0.7143086066}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7421790723,"sentiment-analysis_deepsentipers_precision_modified":0.705605232,"sentiment-analysis_deepsentipers_recall_modified":0.7565637786,"sentiment-analysis_deepsentipers_fscore_modified":0.7108099837,"sentiment-analysis_deepsentipers_acc":0.7674288901,"sentiment-analysis_deepsentipers_precision":0.7296107642,"sentiment-analysis_deepsentipers_recall":0.7823029813,"sentiment-analysis_deepsentipers_fscore":0.7349925877,"sentiment-analysis_deepsentipers_valid_output_ratio":0.9670981661,"nlu_score":0.628506628}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.6817691478,"sentiment-analysis_deepsentipers_precision_modified":0.6546744642,"sentiment-analysis_deepsentipers_recall_modified":0.7378694789,"sentiment-analysis_deepsentipers_fscore_modified":0.6356142977,"sentiment-analysis_deepsentipers_acc":0.6817691478,"sentiment-analysis_deepsentipers_precision":0.6546744642,"sentiment-analysis_deepsentipers_recall":0.7378694789,"sentiment-analysis_deepsentipers_fscore":0.6356142977,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6241793507}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.738403452,"sentiment-analysis_deepsentipers_precision_modified":0.706763853,"sentiment-analysis_deepsentipers_recall_modified":0.7658510846,"sentiment-analysis_deepsentipers_fscore_modified":0.726373242,"sentiment-analysis_deepsentipers_acc":0.738403452,"sentiment-analysis_deepsentipers_precision":0.706763853,"sentiment-analysis_deepsentipers_recall":0.7658510846,"sentiment-analysis_deepsentipers_fscore":0.726373242,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sentiment-analysis_deepsentipers_acc_modified":0.806364617,"sentiment-analysis_deepsentipers_precision_modified":0.7705568258,"sentiment-analysis_deepsentipers_recall_modified":0.8234753765,"sentiment-analysis_deepsentipers_fscore_modified":0.7802386366,"sentiment-analysis_deepsentipers_acc":0.806364617,"sentiment-analysis_deepsentipers_precision":0.7705568258,"sentiment-analysis_deepsentipers_recall":0.8234753765,"sentiment-analysis_deepsentipers_fscore":0.7802386366,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.7144353486}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sentiment-analysis_deepsentipers_acc_modified":0.7885652643,"sentiment-analysis_deepsentipers_precision_modified":0.757057239,"sentiment-analysis_deepsentipers_recall_modified":0.8134053732,"sentiment-analysis_deepsentipers_fscore_modified":0.7618040556,"sentiment-analysis_deepsentipers_acc":0.7911255411,"sentiment-analysis_deepsentipers_precision":0.7595152171,"sentiment-analysis_deepsentipers_recall":0.8160462998,"sentiment-analysis_deepsentipers_fscore":0.7642774453,"sentiment-analysis_deepsentipers_valid_output_ratio":0.996763754,"nlu_score":0.6749652797}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7837108954,"sentiment-analysis_deepsentipers_precision_modified":0.7439934995,"sentiment-analysis_deepsentipers_recall_modified":0.8027830842,"sentiment-analysis_deepsentipers_fscore_modified":0.7554845169,"sentiment-analysis_deepsentipers_acc":0.7849810913,"sentiment-analysis_deepsentipers_precision":0.7451993237,"sentiment-analysis_deepsentipers_recall":0.8040841913,"sentiment-analysis_deepsentipers_fscore":0.7567089651,"sentiment-analysis_deepsentipers_valid_output_ratio":0.998381877,"nlu_score":0.6552939868}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7518878101,"sentiment-analysis_deepsentipers_precision_modified":0.7333601788,"sentiment-analysis_deepsentipers_recall_modified":0.7850018857,"sentiment-analysis_deepsentipers_fscore_modified":0.7214827861,"sentiment-analysis_deepsentipers_acc":0.752293578,"sentiment-analysis_deepsentipers_precision":0.7337559479,"sentiment-analysis_deepsentipers_recall":0.785425524,"sentiment-analysis_deepsentipers_fscore":0.7218721454,"sentiment-analysis_deepsentipers_valid_output_ratio":0.9994606257,"nlu_score":0.6552152029}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sentiment-analysis_deepsentipers_acc_modified":0.8047464941,"sentiment-analysis_deepsentipers_precision_modified":0.7661826532,"sentiment-analysis_deepsentipers_recall_modified":0.8089861144,"sentiment-analysis_deepsentipers_fscore_modified":0.7830417049,"sentiment-analysis_deepsentipers_acc":0.8047464941,"sentiment-analysis_deepsentipers_precision":0.7661826532,"sentiment-analysis_deepsentipers_recall":0.8089861144,"sentiment-analysis_deepsentipers_fscore":0.7830417049,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sentiment-analysis_deepsentipers_acc_modified":null,"sentiment-analysis_deepsentipers_precision_modified":null,"sentiment-analysis_deepsentipers_recall_modified":null,"sentiment-analysis_deepsentipers_fscore_modified":null,"sentiment-analysis_deepsentipers_acc":null,"sentiment-analysis_deepsentipers_precision":null,"sentiment-analysis_deepsentipers_recall":null,"sentiment-analysis_deepsentipers_fscore":null,"sentiment-analysis_deepsentipers_valid_output_ratio":null,"nlu_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7556634304,"sentiment-analysis_deepsentipers_precision_modified":0.7100962569,"sentiment-analysis_deepsentipers_recall_modified":0.796296032,"sentiment-analysis_deepsentipers_fscore_modified":0.7198160026,"sentiment-analysis_deepsentipers_acc":0.7556634304,"sentiment-analysis_deepsentipers_precision":0.7100962569,"sentiment-analysis_deepsentipers_recall":0.796296032,"sentiment-analysis_deepsentipers_fscore":0.7198160026,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7459546926,"sentiment-analysis_deepsentipers_precision_modified":0.696002467,"sentiment-analysis_deepsentipers_recall_modified":0.7725731976,"sentiment-analysis_deepsentipers_fscore_modified":0.7160207999,"sentiment-analysis_deepsentipers_acc":0.7459546926,"sentiment-analysis_deepsentipers_precision":0.696002467,"sentiment-analysis_deepsentipers_recall":0.7725731976,"sentiment-analysis_deepsentipers_fscore":0.7160207999,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7820927724,"sentiment-analysis_deepsentipers_precision_modified":0.7592820571,"sentiment-analysis_deepsentipers_recall_modified":0.7768252647,"sentiment-analysis_deepsentipers_fscore_modified":0.7562669975,"sentiment-analysis_deepsentipers_acc":0.7820927724,"sentiment-analysis_deepsentipers_precision":0.7592820571,"sentiment-analysis_deepsentipers_recall":0.7768252647,"sentiment-analysis_deepsentipers_fscore":0.7562669975,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.715210356,"sentiment-analysis_deepsentipers_precision_modified":0.6703215936,"sentiment-analysis_deepsentipers_recall_modified":0.7384303354,"sentiment-analysis_deepsentipers_fscore_modified":0.6873376696,"sentiment-analysis_deepsentipers_acc":0.7651471437,"sentiment-analysis_deepsentipers_precision":0.7171241976,"sentiment-analysis_deepsentipers_recall":0.7899883681,"sentiment-analysis_deepsentipers_fscore":0.7353283551,"sentiment-analysis_deepsentipers_valid_output_ratio":0.9347357066,"nlu_score":0.4086928082}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sentiment-analysis_deepsentipers_acc_modified":0.7521691974,"sentiment-analysis_deepsentipers_precision_modified":0.7149147283,"sentiment-analysis_deepsentipers_recall_modified":0.7661218172,"sentiment-analysis_deepsentipers_fscore_modified":0.7340307684,"sentiment-analysis_deepsentipers_acc":0.7550353838,"sentiment-analysis_deepsentipers_precision":0.7176389542,"sentiment-analysis_deepsentipers_recall":0.7690411709,"sentiment-analysis_deepsentipers_fscore":0.7368278372,"sentiment-analysis_deepsentipers_valid_output_ratio":0.9962039046,"nlu_score":0.3749414991}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.5949298813,"sentiment-analysis_deepsentipers_precision_modified":0.6633283768,"sentiment-analysis_deepsentipers_recall_modified":0.6739827327,"sentiment-analysis_deepsentipers_fscore_modified":0.597099001,"sentiment-analysis_deepsentipers_acc":0.5958941113,"sentiment-analysis_deepsentipers_precision":0.6644034633,"sentiment-analysis_deepsentipers_recall":0.6750750872,"sentiment-analysis_deepsentipers_fscore":0.5980667466,"sentiment-analysis_deepsentipers_valid_output_ratio":0.998381877,"nlu_score":0.5661558794}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","sentiment-analysis_deepsentipers_acc_modified":0.7038834951,"sentiment-analysis_deepsentipers_precision_modified":0.6558175114,"sentiment-analysis_deepsentipers_recall_modified":0.7195323034,"sentiment-analysis_deepsentipers_fscore_modified":0.6634075099,"sentiment-analysis_deepsentipers_acc":0.7038834951,"sentiment-analysis_deepsentipers_precision":0.6558175114,"sentiment-analysis_deepsentipers_recall":0.7195323034,"sentiment-analysis_deepsentipers_fscore":0.6634075099,"sentiment-analysis_deepsentipers_valid_output_ratio":1.0,"nlu_score":0.456845738}
         | 
    	
        leaderboard/boards_data/sts_FarSICK.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_FarSICK_corrcoef_modified":0.8606070195,"sts_FarSICK_corrcoef":0.8606070195,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8471466571,"sts_FarSICK_corrcoef":0.8471466571,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6241793507}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8332013424,"sts_FarSICK_corrcoef":0.8332013424,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8602460091,"sts_FarSICK_corrcoef":0.8602460091,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6552152029}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_FarSICK_corrcoef_modified":0.8624442565,"sts_FarSICK_corrcoef":0.8624442565,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_FarSICK_corrcoef_modified":null,"sts_FarSICK_corrcoef":null,"sts_FarSICK_valid_output_ratio":null,"nlu_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8796836219,"sts_FarSICK_corrcoef":0.8796836219,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8509006434,"sts_FarSICK_corrcoef":0.8509006434,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8550824218,"sts_FarSICK_corrcoef":0.8550824218,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_FarSICK_corrcoef_modified":0.2533632205,"sts_FarSICK_corrcoef":0.8617796616,"sts_FarSICK_valid_output_ratio":0.294,"nlu_score":0.3749414991}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8346099969,"sts_FarSICK_corrcoef":0.8346099969,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.5661558794}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8020636156,"sts_FarSICK_corrcoef":0.8020636156,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.456845738}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_FarSICK_corrcoef_modified":0.8606070195,"sts_FarSICK_corrcoef":0.8606070195,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8438423833,"sts_FarSICK_corrcoef":0.8438423833,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.628506628}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8471466571,"sts_FarSICK_corrcoef":0.8471466571,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6241793507}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8332013424,"sts_FarSICK_corrcoef":0.8332013424,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_FarSICK_corrcoef_modified":0.8521163575,"sts_FarSICK_corrcoef":0.8521163575,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.7144353486}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_FarSICK_corrcoef_modified":0.8404353896,"sts_FarSICK_corrcoef":0.8404353896,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6749652797}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8474953563,"sts_FarSICK_corrcoef":0.8474953563,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6552939868}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8602460091,"sts_FarSICK_corrcoef":0.8602460091,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6552152029}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_FarSICK_corrcoef_modified":0.8624442565,"sts_FarSICK_corrcoef":0.8624442565,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_FarSICK_corrcoef_modified":null,"sts_FarSICK_corrcoef":null,"sts_FarSICK_valid_output_ratio":null,"nlu_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8796836219,"sts_FarSICK_corrcoef":0.8796836219,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8509006434,"sts_FarSICK_corrcoef":0.8509006434,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8550824218,"sts_FarSICK_corrcoef":0.8550824218,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.0982656524,"sts_FarSICK_corrcoef":0.9633887492,"sts_FarSICK_valid_output_ratio":0.102,"nlu_score":0.4086928082}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_FarSICK_corrcoef_modified":0.2533632205,"sts_FarSICK_corrcoef":0.8617796616,"sts_FarSICK_valid_output_ratio":0.294,"nlu_score":0.3749414991}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8346099969,"sts_FarSICK_corrcoef":0.8346099969,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.5661558794}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","sts_FarSICK_corrcoef_modified":0.8020636156,"sts_FarSICK_corrcoef":0.8020636156,"sts_FarSICK_valid_output_ratio":1.0,"nlu_score":0.456845738}
         | 
    	
        leaderboard/boards_data/sts_SynPerSTS.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_SynPerSTS_corrcoef_modified":0.9639002346,"sts_SynPerSTS_corrcoef":0.9639002346,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9198771683,"sts_SynPerSTS_corrcoef":0.9198771683,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6241793507}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9445586775,"sts_SynPerSTS_corrcoef":0.9445586775,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9587180795,"sts_SynPerSTS_corrcoef":0.9587180795,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6552152029}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_SynPerSTS_corrcoef_modified":0.9620104912,"sts_SynPerSTS_corrcoef":0.9620104912,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_SynPerSTS_corrcoef_modified":null,"sts_SynPerSTS_corrcoef":null,"sts_SynPerSTS_valid_output_ratio":null,"nlu_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9583160478,"sts_SynPerSTS_corrcoef":0.9583160478,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9603899338,"sts_SynPerSTS_corrcoef":0.9603899338,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.961773092,"sts_SynPerSTS_corrcoef":0.961773092,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_SynPerSTS_corrcoef_modified":0.3217761614,"sts_SynPerSTS_corrcoef":0.8791698399,"sts_SynPerSTS_valid_output_ratio":0.366,"nlu_score":0.3749414991}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9424987971,"sts_SynPerSTS_corrcoef":0.9424987971,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.5661558794}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.8942713775,"sts_SynPerSTS_corrcoef":0.8942713775,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.456845738}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_SynPerSTS_corrcoef_modified":0.9639002346,"sts_SynPerSTS_corrcoef":0.9639002346,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9496068485,"sts_SynPerSTS_corrcoef":0.9496068485,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.628506628}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9198771683,"sts_SynPerSTS_corrcoef":0.9198771683,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6241793507}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9445586775,"sts_SynPerSTS_corrcoef":0.9445586775,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_SynPerSTS_corrcoef_modified":0.9405179912,"sts_SynPerSTS_corrcoef":0.9405179912,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.7144353486}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_SynPerSTS_corrcoef_modified":0.9417676956,"sts_SynPerSTS_corrcoef":0.9417676956,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6749652797}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9491290877,"sts_SynPerSTS_corrcoef":0.9491290877,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6552939868}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9587180795,"sts_SynPerSTS_corrcoef":0.9587180795,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6552152029}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_SynPerSTS_corrcoef_modified":0.9620104912,"sts_SynPerSTS_corrcoef":0.9620104912,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_SynPerSTS_corrcoef_modified":null,"sts_SynPerSTS_corrcoef":null,"sts_SynPerSTS_valid_output_ratio":null,"nlu_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9583160478,"sts_SynPerSTS_corrcoef":0.9583160478,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9603899338,"sts_SynPerSTS_corrcoef":0.9603899338,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.961773092,"sts_SynPerSTS_corrcoef":0.961773092,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.0975200826,"sts_SynPerSTS_corrcoef":0.9752008261,"sts_SynPerSTS_valid_output_ratio":0.1,"nlu_score":0.4086928082}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","sts_SynPerSTS_corrcoef_modified":0.3217761614,"sts_SynPerSTS_corrcoef":0.8791698399,"sts_SynPerSTS_valid_output_ratio":0.366,"nlu_score":0.3749414991}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.9424987971,"sts_SynPerSTS_corrcoef":0.9424987971,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.5661558794}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","sts_SynPerSTS_corrcoef_modified":0.8942713775,"sts_SynPerSTS_corrcoef":0.8942713775,"sts_SynPerSTS_valid_output_ratio":1.0,"nlu_score":0.456845738}
         | 
    	
        leaderboard/boards_data/summarization_PnSummary.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_PnSummary_rougeL_precision":0.1188323392,"summarization_PnSummary_rougeL_recall":0.3948447809,"summarization_PnSummary_rougeL_f1_score":0.1786530476,"nlg_score":0.1779340777}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1095844839,"summarization_PnSummary_rougeL_recall":0.3735331299,"summarization_PnSummary_rougeL_f1_score":0.1645385252,"nlg_score":0.0949943578}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1227039295,"summarization_PnSummary_rougeL_recall":0.4315497639,"summarization_PnSummary_rougeL_f1_score":0.1856517383,"nlg_score":0.1880477876}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1072486168,"summarization_PnSummary_rougeL_recall":0.3966587345,"summarization_PnSummary_rougeL_f1_score":0.1627029568,"nlg_score":0.0940241349}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_PnSummary_rougeL_precision":0.1234743619,"summarization_PnSummary_rougeL_recall":0.376111826,"summarization_PnSummary_rougeL_f1_score":0.1808600563,"nlg_score":0.194675133}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_PnSummary_rougeL_precision":null,"summarization_PnSummary_rougeL_recall":null,"summarization_PnSummary_rougeL_f1_score":null,"nlg_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1124574222,"summarization_PnSummary_rougeL_recall":0.3717393409,"summarization_PnSummary_rougeL_f1_score":0.1673025553,"nlg_score":0.1067134448}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1123870374,"summarization_PnSummary_rougeL_recall":0.4032007327,"summarization_PnSummary_rougeL_f1_score":0.17115848,"nlg_score":0.16056333}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1089978489,"summarization_PnSummary_rougeL_recall":0.3936021933,"summarization_PnSummary_rougeL_f1_score":0.1662525669,"nlg_score":0.1679338638}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_PnSummary_rougeL_precision":0.132916538,"summarization_PnSummary_rougeL_recall":0.3579358655,"summarization_PnSummary_rougeL_f1_score":0.1887379797,"nlg_score":0.1089333827}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1029257145,"summarization_PnSummary_rougeL_recall":0.4347811424,"summarization_PnSummary_rougeL_f1_score":0.1621438757,"nlg_score":0.1319091735}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.0833149314,"summarization_PnSummary_rougeL_recall":0.4027758903,"summarization_PnSummary_rougeL_f1_score":0.1338404051,"nlg_score":0.112015688}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_PnSummary_rougeL_precision":0.1188323392,"summarization_PnSummary_rougeL_recall":0.3948447809,"summarization_PnSummary_rougeL_f1_score":0.1786530476,"nlg_score":0.1779340777}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.0796516779,"summarization_PnSummary_rougeL_recall":0.3573917363,"summarization_PnSummary_rougeL_f1_score":0.1263677591,"nlg_score":0.1334687319}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1095844839,"summarization_PnSummary_rougeL_recall":0.3735331299,"summarization_PnSummary_rougeL_f1_score":0.1645385252,"nlg_score":0.0949943578}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1227039295,"summarization_PnSummary_rougeL_recall":0.4315497639,"summarization_PnSummary_rougeL_f1_score":0.1856517383,"nlg_score":0.1880477876}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_PnSummary_rougeL_precision":0.0917305447,"summarization_PnSummary_rougeL_recall":0.3893845098,"summarization_PnSummary_rougeL_f1_score":0.1447284086,"nlg_score":0.181552926}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_PnSummary_rougeL_precision":0.0830986853,"summarization_PnSummary_rougeL_recall":0.3565850313,"summarization_PnSummary_rougeL_f1_score":0.1308633101,"nlg_score":0.1643361642}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.0783955467,"summarization_PnSummary_rougeL_recall":0.3671775126,"summarization_PnSummary_rougeL_f1_score":0.1256898612,"nlg_score":0.1454089411}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1072486168,"summarization_PnSummary_rougeL_recall":0.3966587345,"summarization_PnSummary_rougeL_f1_score":0.1627029568,"nlg_score":0.0940241349}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_PnSummary_rougeL_precision":0.1234743619,"summarization_PnSummary_rougeL_recall":0.376111826,"summarization_PnSummary_rougeL_f1_score":0.1808600563,"nlg_score":0.194675133}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_PnSummary_rougeL_precision":null,"summarization_PnSummary_rougeL_recall":null,"summarization_PnSummary_rougeL_f1_score":null,"nlg_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1124574222,"summarization_PnSummary_rougeL_recall":0.3717393409,"summarization_PnSummary_rougeL_f1_score":0.1673025553,"nlg_score":0.1067134448}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1123870374,"summarization_PnSummary_rougeL_recall":0.4032007327,"summarization_PnSummary_rougeL_f1_score":0.17115848,"nlg_score":0.16056333}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1089978489,"summarization_PnSummary_rougeL_recall":0.3936021933,"summarization_PnSummary_rougeL_f1_score":0.1662525669,"nlg_score":0.1679338638}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1377053282,"summarization_PnSummary_rougeL_recall":0.380073051,"summarization_PnSummary_rougeL_f1_score":0.1928750247,"nlg_score":0.1567965528}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_PnSummary_rougeL_precision":0.132916538,"summarization_PnSummary_rougeL_recall":0.3579358655,"summarization_PnSummary_rougeL_f1_score":0.1887379797,"nlg_score":0.1089333827}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.1029257145,"summarization_PnSummary_rougeL_recall":0.4347811424,"summarization_PnSummary_rougeL_f1_score":0.1621438757,"nlg_score":0.1319091735}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","summarization_PnSummary_rougeL_precision":0.0833149314,"summarization_PnSummary_rougeL_recall":0.4027758903,"summarization_PnSummary_rougeL_f1_score":0.1338404051,"nlg_score":0.112015688}
         | 
    	
        leaderboard/boards_data/summarization_SamSUM-fa.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_SamSUM-fa_rougeL_precision":0.1538512444,"summarization_SamSUM-fa_rougeL_recall":0.3849531288,"summarization_SamSUM-fa_rougeL_f1_score":0.2115502707,"nlg_score":0.1779340777}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1638274716,"summarization_SamSUM-fa_rougeL_recall":0.3535878882,"summarization_SamSUM-fa_rougeL_f1_score":0.2134854664,"nlg_score":0.0949943578}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1591262985,"summarization_SamSUM-fa_rougeL_recall":0.4163090512,"summarization_SamSUM-fa_rougeL_f1_score":0.2208876443,"nlg_score":0.1880477876}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1468362777,"summarization_SamSUM-fa_rougeL_recall":0.3858089513,"summarization_SamSUM-fa_rougeL_f1_score":0.2041300257,"nlg_score":0.0940241349}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_SamSUM-fa_rougeL_precision":0.1681357159,"summarization_SamSUM-fa_rougeL_recall":0.3567938895,"summarization_SamSUM-fa_rougeL_f1_score":0.2189693454,"nlg_score":0.194675133}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_SamSUM-fa_rougeL_precision":null,"summarization_SamSUM-fa_rougeL_recall":null,"summarization_SamSUM-fa_rougeL_f1_score":null,"nlg_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1588367988,"summarization_SamSUM-fa_rougeL_recall":0.3735722635,"summarization_SamSUM-fa_rougeL_f1_score":0.2131671502,"nlg_score":0.1067134448}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1469468837,"summarization_SamSUM-fa_rougeL_recall":0.3743807014,"summarization_SamSUM-fa_rougeL_f1_score":0.2022859929,"nlg_score":0.16056333}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1514618398,"summarization_SamSUM-fa_rougeL_recall":0.3683020708,"summarization_SamSUM-fa_rougeL_f1_score":0.2063212948,"nlg_score":0.1679338638}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_SamSUM-fa_rougeL_precision":0.1772724525,"summarization_SamSUM-fa_rougeL_recall":0.341583677,"summarization_SamSUM-fa_rougeL_f1_score":0.2233271064,"nlg_score":0.1089333827}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.147286408,"summarization_SamSUM-fa_rougeL_recall":0.4066657958,"summarization_SamSUM-fa_rougeL_f1_score":0.2072278176,"nlg_score":0.1319091735}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1137219495,"summarization_SamSUM-fa_rougeL_recall":0.3496708707,"summarization_SamSUM-fa_rougeL_f1_score":0.1628971148,"nlg_score":0.112015688}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_SamSUM-fa_rougeL_precision":0.1538512444,"summarization_SamSUM-fa_rougeL_recall":0.3849531288,"summarization_SamSUM-fa_rougeL_f1_score":0.2115502707,"nlg_score":0.1779340777}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1076131004,"summarization_SamSUM-fa_rougeL_recall":0.354952604,"summarization_SamSUM-fa_rougeL_f1_score":0.1578241504,"nlg_score":0.1334687319}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1638274716,"summarization_SamSUM-fa_rougeL_recall":0.3535878882,"summarization_SamSUM-fa_rougeL_f1_score":0.2134854664,"nlg_score":0.0949943578}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1591262985,"summarization_SamSUM-fa_rougeL_recall":0.4163090512,"summarization_SamSUM-fa_rougeL_f1_score":0.2208876443,"nlg_score":0.1880477876}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_SamSUM-fa_rougeL_precision":0.1553547312,"summarization_SamSUM-fa_rougeL_recall":0.3357735524,"summarization_SamSUM-fa_rougeL_f1_score":0.2045988783,"nlg_score":0.181552926}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_SamSUM-fa_rougeL_precision":0.1387162197,"summarization_SamSUM-fa_rougeL_recall":0.3472256524,"summarization_SamSUM-fa_rougeL_f1_score":0.1899415698,"nlg_score":0.1643361642}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1158613629,"summarization_SamSUM-fa_rougeL_recall":0.3578031642,"summarization_SamSUM-fa_rougeL_f1_score":0.168058919,"nlg_score":0.1454089411}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1468362777,"summarization_SamSUM-fa_rougeL_recall":0.3858089513,"summarization_SamSUM-fa_rougeL_f1_score":0.2041300257,"nlg_score":0.0940241349}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_SamSUM-fa_rougeL_precision":0.1681357159,"summarization_SamSUM-fa_rougeL_recall":0.3567938895,"summarization_SamSUM-fa_rougeL_f1_score":0.2189693454,"nlg_score":0.194675133}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_SamSUM-fa_rougeL_precision":null,"summarization_SamSUM-fa_rougeL_recall":null,"summarization_SamSUM-fa_rougeL_f1_score":null,"nlg_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1588367988,"summarization_SamSUM-fa_rougeL_recall":0.3735722635,"summarization_SamSUM-fa_rougeL_f1_score":0.2131671502,"nlg_score":0.1067134448}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1469468837,"summarization_SamSUM-fa_rougeL_recall":0.3743807014,"summarization_SamSUM-fa_rougeL_f1_score":0.2022859929,"nlg_score":0.16056333}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1514618398,"summarization_SamSUM-fa_rougeL_recall":0.3683020708,"summarization_SamSUM-fa_rougeL_f1_score":0.2063212948,"nlg_score":0.1679338638}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1539866165,"summarization_SamSUM-fa_rougeL_recall":0.341409574,"summarization_SamSUM-fa_rougeL_f1_score":0.2007085976,"nlg_score":0.1567965528}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","summarization_SamSUM-fa_rougeL_precision":0.1772724525,"summarization_SamSUM-fa_rougeL_recall":0.341583677,"summarization_SamSUM-fa_rougeL_f1_score":0.2233271064,"nlg_score":0.1089333827}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.147286408,"summarization_SamSUM-fa_rougeL_recall":0.4066657958,"summarization_SamSUM-fa_rougeL_f1_score":0.2072278176,"nlg_score":0.1319091735}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","summarization_SamSUM-fa_rougeL_precision":0.1137219495,"summarization_SamSUM-fa_rougeL_recall":0.3496708707,"summarization_SamSUM-fa_rougeL_f1_score":0.1628971148,"nlg_score":0.112015688}
         | 
    	
        leaderboard/boards_data/tone-classification_SynTone.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","tone-classification_SynTone_acc_modified":0.8198757764,"tone-classification_SynTone_precision_modified":0.8180456965,"tone-classification_SynTone_recall_modified":0.5977640757,"tone-classification_SynTone_fscore_modified":0.6364434216,"tone-classification_SynTone_acc":0.8859060403,"tone-classification_SynTone_precision":0.8839285714,"tone-classification_SynTone_recall":0.6459061489,"tone-classification_SynTone_fscore":0.68770061,"tone-classification_SynTone_valid_output_ratio":0.9254658385,"nlu_score":0.7143086066}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.5031055901,"tone-classification_SynTone_precision_modified":0.5228364877,"tone-classification_SynTone_recall_modified":0.5168736971,"tone-classification_SynTone_fscore_modified":0.4644759375,"tone-classification_SynTone_acc":0.5094339623,"tone-classification_SynTone_precision":0.5294130473,"tone-classification_SynTone_recall":0.523375253,"tone-classification_SynTone_fscore":0.4703184021,"tone-classification_SynTone_valid_output_ratio":0.9875776398,"nlu_score":0.6241793507}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.6770186335,"tone-classification_SynTone_precision_modified":0.6041666667,"tone-classification_SynTone_recall_modified":0.5499765318,"tone-classification_SynTone_fscore_modified":0.5393404488,"tone-classification_SynTone_acc":0.6770186335,"tone-classification_SynTone_precision":0.6041666667,"tone-classification_SynTone_recall":0.5499765318,"tone-classification_SynTone_fscore":0.5393404488,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.5776397516,"tone-classification_SynTone_precision_modified":0.4784671979,"tone-classification_SynTone_recall_modified":0.4996211806,"tone-classification_SynTone_fscore_modified":0.4487276462,"tone-classification_SynTone_acc":0.5849056604,"tone-classification_SynTone_precision":0.4844856532,"tone-classification_SynTone_recall":0.5059057238,"tone-classification_SynTone_fscore":0.4543720191,"tone-classification_SynTone_valid_output_ratio":0.9875776398,"nlu_score":0.6552152029}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","tone-classification_SynTone_acc_modified":0.9130434783,"tone-classification_SynTone_precision_modified":0.8396595026,"tone-classification_SynTone_recall_modified":0.7058371736,"tone-classification_SynTone_fscore_modified":0.748745873,"tone-classification_SynTone_acc":0.9130434783,"tone-classification_SynTone_precision":0.8396595026,"tone-classification_SynTone_recall":0.7058371736,"tone-classification_SynTone_fscore":0.748745873,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","tone-classification_SynTone_acc_modified":null,"tone-classification_SynTone_precision_modified":null,"tone-classification_SynTone_recall_modified":null,"tone-classification_SynTone_fscore_modified":null,"tone-classification_SynTone_acc":null,"tone-classification_SynTone_precision":null,"tone-classification_SynTone_recall":null,"tone-classification_SynTone_fscore":null,"tone-classification_SynTone_valid_output_ratio":null,"nlu_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.7888198758,"tone-classification_SynTone_precision_modified":0.6529418051,"tone-classification_SynTone_recall_modified":0.7187467998,"tone-classification_SynTone_fscore_modified":0.6745690521,"tone-classification_SynTone_acc":0.7888198758,"tone-classification_SynTone_precision":0.6529418051,"tone-classification_SynTone_recall":0.7187467998,"tone-classification_SynTone_fscore":0.6745690521,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.4968944099,"tone-classification_SynTone_precision_modified":0.5363835928,"tone-classification_SynTone_recall_modified":0.5772956136,"tone-classification_SynTone_fscore_modified":0.4755414981,"tone-classification_SynTone_acc":0.4968944099,"tone-classification_SynTone_precision":0.5363835928,"tone-classification_SynTone_recall":0.5772956136,"tone-classification_SynTone_fscore":0.4755414981,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.8074534161,"tone-classification_SynTone_precision_modified":0.6799424424,"tone-classification_SynTone_recall_modified":0.6338304318,"tone-classification_SynTone_fscore_modified":0.6490392995,"tone-classification_SynTone_acc":0.8074534161,"tone-classification_SynTone_precision":0.6799424424,"tone-classification_SynTone_recall":0.6338304318,"tone-classification_SynTone_fscore":0.6490392995,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","tone-classification_SynTone_acc_modified":0.0,"tone-classification_SynTone_precision_modified":0.0,"tone-classification_SynTone_recall_modified":0.0,"tone-classification_SynTone_fscore_modified":0.0,"tone-classification_SynTone_acc":0.0,"tone-classification_SynTone_precision":0.0,"tone-classification_SynTone_recall":0.0,"tone-classification_SynTone_fscore":0.0,"tone-classification_SynTone_valid_output_ratio":0.0,"nlu_score":0.3749414991}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.7763975155,"tone-classification_SynTone_precision_modified":0.6774948824,"tone-classification_SynTone_recall_modified":0.67683866,"tone-classification_SynTone_fscore_modified":0.668356732,"tone-classification_SynTone_acc":0.7911392405,"tone-classification_SynTone_precision":0.6903587093,"tone-classification_SynTone_recall":0.689690027,"tone-classification_SynTone_fscore":0.6810470497,"tone-classification_SynTone_valid_output_ratio":0.9813664596,"nlu_score":0.5661558794}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.1552795031,"tone-classification_SynTone_precision_modified":0.1130928528,"tone-classification_SynTone_recall_modified":0.2155401891,"tone-classification_SynTone_fscore_modified":0.1465713376,"tone-classification_SynTone_acc":0.3424657534,"tone-classification_SynTone_precision":0.2494239631,"tone-classification_SynTone_recall":0.4753694581,"tone-classification_SynTone_fscore":0.3232600733,"tone-classification_SynTone_valid_output_ratio":0.4534161491,"nlu_score":0.456845738}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","tone-classification_SynTone_acc_modified":0.8198757764,"tone-classification_SynTone_precision_modified":0.8180456965,"tone-classification_SynTone_recall_modified":0.5977640757,"tone-classification_SynTone_fscore_modified":0.6364434216,"tone-classification_SynTone_acc":0.8859060403,"tone-classification_SynTone_precision":0.8839285714,"tone-classification_SynTone_recall":0.6459061489,"tone-classification_SynTone_fscore":0.68770061,"tone-classification_SynTone_valid_output_ratio":0.9254658385,"nlu_score":0.7143086066}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.801242236,"tone-classification_SynTone_precision_modified":0.6325567597,"tone-classification_SynTone_recall_modified":0.5106323908,"tone-classification_SynTone_fscore_modified":0.5211970678,"tone-classification_SynTone_acc":0.8164556962,"tone-classification_SynTone_precision":0.6445673311,"tone-classification_SynTone_recall":0.5203279425,"tone-classification_SynTone_fscore":0.5310932146,"tone-classification_SynTone_valid_output_ratio":0.9813664596,"nlu_score":0.628506628}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.5031055901,"tone-classification_SynTone_precision_modified":0.5228364877,"tone-classification_SynTone_recall_modified":0.5168736971,"tone-classification_SynTone_fscore_modified":0.4644759375,"tone-classification_SynTone_acc":0.5094339623,"tone-classification_SynTone_precision":0.5294130473,"tone-classification_SynTone_recall":0.523375253,"tone-classification_SynTone_fscore":0.4703184021,"tone-classification_SynTone_valid_output_ratio":0.9875776398,"nlu_score":0.6241793507}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.6770186335,"tone-classification_SynTone_precision_modified":0.6041666667,"tone-classification_SynTone_recall_modified":0.5499765318,"tone-classification_SynTone_fscore_modified":0.5393404488,"tone-classification_SynTone_acc":0.6770186335,"tone-classification_SynTone_precision":0.6041666667,"tone-classification_SynTone_recall":0.5499765318,"tone-classification_SynTone_fscore":0.5393404488,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.6297634971}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","tone-classification_SynTone_acc_modified":0.8944099379,"tone-classification_SynTone_precision_modified":0.8288135593,"tone-classification_SynTone_recall_modified":0.6730414747,"tone-classification_SynTone_fscore_modified":0.7238560859,"tone-classification_SynTone_acc":0.8944099379,"tone-classification_SynTone_precision":0.8288135593,"tone-classification_SynTone_recall":0.6730414747,"tone-classification_SynTone_fscore":0.7238560859,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.7144353486}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","tone-classification_SynTone_acc_modified":0.8447204969,"tone-classification_SynTone_precision_modified":0.6820625483,"tone-classification_SynTone_recall_modified":0.5681634349,"tone-classification_SynTone_fscore_modified":0.579448271,"tone-classification_SynTone_acc":0.85,"tone-classification_SynTone_precision":0.6863254393,"tone-classification_SynTone_recall":0.5717144564,"tone-classification_SynTone_fscore":0.5830698227,"tone-classification_SynTone_valid_output_ratio":0.9937888199,"nlu_score":0.6749652797}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.850931677,"tone-classification_SynTone_precision_modified":0.7155244384,"tone-classification_SynTone_recall_modified":0.5926267281,"tone-classification_SynTone_fscore_modified":0.6120058392,"tone-classification_SynTone_acc":0.850931677,"tone-classification_SynTone_precision":0.7155244384,"tone-classification_SynTone_recall":0.5926267281,"tone-classification_SynTone_fscore":0.6120058392,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.6552939868}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.5776397516,"tone-classification_SynTone_precision_modified":0.4784671979,"tone-classification_SynTone_recall_modified":0.4996211806,"tone-classification_SynTone_fscore_modified":0.4487276462,"tone-classification_SynTone_acc":0.5849056604,"tone-classification_SynTone_precision":0.4844856532,"tone-classification_SynTone_recall":0.5059057238,"tone-classification_SynTone_fscore":0.4543720191,"tone-classification_SynTone_valid_output_ratio":0.9875776398,"nlu_score":0.6552152029}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","tone-classification_SynTone_acc_modified":0.9130434783,"tone-classification_SynTone_precision_modified":0.8396595026,"tone-classification_SynTone_recall_modified":0.7058371736,"tone-classification_SynTone_fscore_modified":0.748745873,"tone-classification_SynTone_acc":0.9130434783,"tone-classification_SynTone_precision":0.8396595026,"tone-classification_SynTone_recall":0.7058371736,"tone-classification_SynTone_fscore":0.748745873,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","tone-classification_SynTone_acc_modified":null,"tone-classification_SynTone_precision_modified":null,"tone-classification_SynTone_recall_modified":null,"tone-classification_SynTone_fscore_modified":null,"tone-classification_SynTone_acc":null,"tone-classification_SynTone_precision":null,"tone-classification_SynTone_recall":null,"tone-classification_SynTone_fscore":null,"tone-classification_SynTone_valid_output_ratio":null,"nlu_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.7888198758,"tone-classification_SynTone_precision_modified":0.6529418051,"tone-classification_SynTone_recall_modified":0.7187467998,"tone-classification_SynTone_fscore_modified":0.6745690521,"tone-classification_SynTone_acc":0.7888198758,"tone-classification_SynTone_precision":0.6529418051,"tone-classification_SynTone_recall":0.7187467998,"tone-classification_SynTone_fscore":0.6745690521,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.6898261633}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.4968944099,"tone-classification_SynTone_precision_modified":0.5363835928,"tone-classification_SynTone_recall_modified":0.5772956136,"tone-classification_SynTone_fscore_modified":0.4755414981,"tone-classification_SynTone_acc":0.4968944099,"tone-classification_SynTone_precision":0.5363835928,"tone-classification_SynTone_recall":0.5772956136,"tone-classification_SynTone_fscore":0.4755414981,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.8074534161,"tone-classification_SynTone_precision_modified":0.6799424424,"tone-classification_SynTone_recall_modified":0.6338304318,"tone-classification_SynTone_fscore_modified":0.6490392995,"tone-classification_SynTone_acc":0.8074534161,"tone-classification_SynTone_precision":0.6799424424,"tone-classification_SynTone_recall":0.6338304318,"tone-classification_SynTone_fscore":0.6490392995,"tone-classification_SynTone_valid_output_ratio":1.0,"nlu_score":0.6714091535}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.0310559006,"tone-classification_SynTone_precision_modified":0.0155279503,"tone-classification_SynTone_recall_modified":0.0186335404,"tone-classification_SynTone_fscore_modified":0.0169395822,"tone-classification_SynTone_acc":0.8333333333,"tone-classification_SynTone_precision":0.4166666667,"tone-classification_SynTone_recall":0.5,"tone-classification_SynTone_fscore":0.4545454545,"tone-classification_SynTone_valid_output_ratio":0.0372670807,"nlu_score":0.4086928082}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","tone-classification_SynTone_acc_modified":0.0,"tone-classification_SynTone_precision_modified":0.0,"tone-classification_SynTone_recall_modified":0.0,"tone-classification_SynTone_fscore_modified":0.0,"tone-classification_SynTone_acc":0.0,"tone-classification_SynTone_precision":0.0,"tone-classification_SynTone_recall":0.0,"tone-classification_SynTone_fscore":0.0,"tone-classification_SynTone_valid_output_ratio":0.0,"nlu_score":0.3749414991}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.7763975155,"tone-classification_SynTone_precision_modified":0.6774948824,"tone-classification_SynTone_recall_modified":0.67683866,"tone-classification_SynTone_fscore_modified":0.668356732,"tone-classification_SynTone_acc":0.7911392405,"tone-classification_SynTone_precision":0.6903587093,"tone-classification_SynTone_recall":0.689690027,"tone-classification_SynTone_fscore":0.6810470497,"tone-classification_SynTone_valid_output_ratio":0.9813664596,"nlu_score":0.5661558794}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","tone-classification_SynTone_acc_modified":0.1552795031,"tone-classification_SynTone_precision_modified":0.1130928528,"tone-classification_SynTone_recall_modified":0.2155401891,"tone-classification_SynTone_fscore_modified":0.1465713376,"tone-classification_SynTone_acc":0.3424657534,"tone-classification_SynTone_precision":0.2494239631,"tone-classification_SynTone_recall":0.4753694581,"tone-classification_SynTone_fscore":0.3232600733,"tone-classification_SynTone_valid_output_ratio":0.4534161491,"nlu_score":0.456845738}
         | 
    	
        leaderboard/boards_data/topic-classification_sid.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","topic-classification_sid_acc_modified":0.792,"topic-classification_sid_precision_modified":0.662532811,"topic-classification_sid_recall_modified":0.6635073397,"topic-classification_sid_fscore_modified":0.6583038933,"topic-classification_sid_acc":0.792,"topic-classification_sid_precision":0.662532811,"topic-classification_sid_recall":0.6635073397,"topic-classification_sid_fscore":0.6583038933,"topic-classification_sid_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.562,"topic-classification_sid_precision_modified":0.4846723602,"topic-classification_sid_recall_modified":0.454656985,"topic-classification_sid_fscore_modified":0.424509489,"topic-classification_sid_acc":0.5928270042,"topic-classification_sid_precision":0.511257764,"topic-classification_sid_recall":0.4795959757,"topic-classification_sid_fscore":0.4477948196,"topic-classification_sid_valid_output_ratio":0.948,"nlu_score":0.6241793507}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.682,"topic-classification_sid_precision_modified":0.5730049986,"topic-classification_sid_recall_modified":0.5717337985,"topic-classification_sid_fscore_modified":0.5606248332,"topic-classification_sid_acc":0.7239915074,"topic-classification_sid_precision":0.6082855612,"topic-classification_sid_recall":0.6069360918,"topic-classification_sid_fscore":0.595143135,"topic-classification_sid_valid_output_ratio":0.942,"nlu_score":0.6297634971}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.458,"topic-classification_sid_precision_modified":0.3928192753,"topic-classification_sid_recall_modified":0.4072039595,"topic-classification_sid_fscore_modified":0.3544902396,"topic-classification_sid_acc":0.6378830084,"topic-classification_sid_precision":0.5471020547,"topic-classification_sid_recall":0.5671364338,"topic-classification_sid_fscore":0.4937189966,"topic-classification_sid_valid_output_ratio":0.718,"nlu_score":0.6552152029}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","topic-classification_sid_acc_modified":0.748,"topic-classification_sid_precision_modified":0.6428566774,"topic-classification_sid_recall_modified":0.6633522535,"topic-classification_sid_fscore_modified":0.628605048,"topic-classification_sid_acc":0.748,"topic-classification_sid_precision":0.6428566774,"topic-classification_sid_recall":0.6633522535,"topic-classification_sid_fscore":0.628605048,"topic-classification_sid_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","topic-classification_sid_acc_modified":null,"topic-classification_sid_precision_modified":null,"topic-classification_sid_recall_modified":null,"topic-classification_sid_fscore_modified":null,"topic-classification_sid_acc":null,"topic-classification_sid_precision":null,"topic-classification_sid_recall":null,"topic-classification_sid_fscore":null,"topic-classification_sid_valid_output_ratio":null,"nlu_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.702,"topic-classification_sid_precision_modified":0.6070538637,"topic-classification_sid_recall_modified":0.5902772191,"topic-classification_sid_fscore_modified":0.5805725473,"topic-classification_sid_acc":0.7076612903,"topic-classification_sid_precision":0.6119494594,"topic-classification_sid_recall":0.5950375192,"topic-classification_sid_fscore":0.585254584,"topic-classification_sid_valid_output_ratio":0.992,"nlu_score":0.6898261633}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.636,"topic-classification_sid_precision_modified":0.6248180645,"topic-classification_sid_recall_modified":0.5200071748,"topic-classification_sid_fscore_modified":0.5212205085,"topic-classification_sid_acc":0.636,"topic-classification_sid_precision":0.6248180645,"topic-classification_sid_recall":0.5200071748,"topic-classification_sid_fscore":0.5212205085,"topic-classification_sid_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.742,"topic-classification_sid_precision_modified":0.6167254178,"topic-classification_sid_recall_modified":0.6125584783,"topic-classification_sid_fscore_modified":0.5990165281,"topic-classification_sid_acc":0.7449799197,"topic-classification_sid_precision":0.6192022267,"topic-classification_sid_recall":0.6150185525,"topic-classification_sid_fscore":0.6014222169,"topic-classification_sid_valid_output_ratio":0.996,"nlu_score":0.6714091535}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","topic-classification_sid_acc_modified":0.75,"topic-classification_sid_precision_modified":0.6327306402,"topic-classification_sid_recall_modified":0.6347455045,"topic-classification_sid_fscore_modified":0.6231971632,"topic-classification_sid_acc":0.75,"topic-classification_sid_precision":0.6327306402,"topic-classification_sid_recall":0.6347455045,"topic-classification_sid_fscore":0.6231971632,"topic-classification_sid_valid_output_ratio":1.0,"nlu_score":0.3749414991}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.656,"topic-classification_sid_precision_modified":0.5819241823,"topic-classification_sid_recall_modified":0.5649560499,"topic-classification_sid_fscore_modified":0.5472284688,"topic-classification_sid_acc":0.7038626609,"topic-classification_sid_precision":0.6243821699,"topic-classification_sid_recall":0.6061760192,"topic-classification_sid_fscore":0.5871550095,"topic-classification_sid_valid_output_ratio":0.932,"nlu_score":0.5661558794}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.664,"topic-classification_sid_precision_modified":0.5946530353,"topic-classification_sid_recall_modified":0.5719701311,"topic-classification_sid_fscore_modified":0.5732259537,"topic-classification_sid_acc":0.6720647773,"topic-classification_sid_precision":0.6018755418,"topic-classification_sid_recall":0.5789171368,"topic-classification_sid_fscore":0.5801882122,"topic-classification_sid_valid_output_ratio":0.988,"nlu_score":0.456845738}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","topic-classification_sid_acc_modified":0.792,"topic-classification_sid_precision_modified":0.662532811,"topic-classification_sid_recall_modified":0.6635073397,"topic-classification_sid_fscore_modified":0.6583038933,"topic-classification_sid_acc":0.792,"topic-classification_sid_precision":0.662532811,"topic-classification_sid_recall":0.6635073397,"topic-classification_sid_fscore":0.6583038933,"topic-classification_sid_valid_output_ratio":1.0,"nlu_score":0.7143086066}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.674,"topic-classification_sid_precision_modified":0.583557125,"topic-classification_sid_recall_modified":0.5945763405,"topic-classification_sid_fscore_modified":0.5786133505,"topic-classification_sid_acc":0.6962809917,"topic-classification_sid_precision":0.6028482696,"topic-classification_sid_recall":0.6142317567,"topic-classification_sid_fscore":0.5977410646,"topic-classification_sid_valid_output_ratio":0.968,"nlu_score":0.628506628}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.562,"topic-classification_sid_precision_modified":0.4846723602,"topic-classification_sid_recall_modified":0.454656985,"topic-classification_sid_fscore_modified":0.424509489,"topic-classification_sid_acc":0.5928270042,"topic-classification_sid_precision":0.511257764,"topic-classification_sid_recall":0.4795959757,"topic-classification_sid_fscore":0.4477948196,"topic-classification_sid_valid_output_ratio":0.948,"nlu_score":0.6241793507}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.682,"topic-classification_sid_precision_modified":0.5730049986,"topic-classification_sid_recall_modified":0.5717337985,"topic-classification_sid_fscore_modified":0.5606248332,"topic-classification_sid_acc":0.7239915074,"topic-classification_sid_precision":0.6082855612,"topic-classification_sid_recall":0.6069360918,"topic-classification_sid_fscore":0.595143135,"topic-classification_sid_valid_output_ratio":0.942,"nlu_score":0.6297634971}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","topic-classification_sid_acc_modified":0.77,"topic-classification_sid_precision_modified":0.6850986976,"topic-classification_sid_recall_modified":0.6830888647,"topic-classification_sid_fscore_modified":0.6616877857,"topic-classification_sid_acc":0.77,"topic-classification_sid_precision":0.6850986976,"topic-classification_sid_recall":0.6830888647,"topic-classification_sid_fscore":0.6616877857,"topic-classification_sid_valid_output_ratio":1.0,"nlu_score":0.7144353486}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","topic-classification_sid_acc_modified":0.704,"topic-classification_sid_precision_modified":0.5896102708,"topic-classification_sid_recall_modified":0.5884196886,"topic-classification_sid_fscore_modified":0.5823719558,"topic-classification_sid_acc":0.704,"topic-classification_sid_precision":0.5896102708,"topic-classification_sid_recall":0.5884196886,"topic-classification_sid_fscore":0.5823719558,"topic-classification_sid_valid_output_ratio":1.0,"nlu_score":0.6749652797}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.712,"topic-classification_sid_precision_modified":0.6353150272,"topic-classification_sid_recall_modified":0.6244451357,"topic-classification_sid_fscore_modified":0.601429389,"topic-classification_sid_acc":0.712,"topic-classification_sid_precision":0.6353150272,"topic-classification_sid_recall":0.6244451357,"topic-classification_sid_fscore":0.601429389,"topic-classification_sid_valid_output_ratio":1.0,"nlu_score":0.6552939868}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.458,"topic-classification_sid_precision_modified":0.3928192753,"topic-classification_sid_recall_modified":0.4072039595,"topic-classification_sid_fscore_modified":0.3544902396,"topic-classification_sid_acc":0.6378830084,"topic-classification_sid_precision":0.5471020547,"topic-classification_sid_recall":0.5671364338,"topic-classification_sid_fscore":0.4937189966,"topic-classification_sid_valid_output_ratio":0.718,"nlu_score":0.6552152029}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","topic-classification_sid_acc_modified":0.748,"topic-classification_sid_precision_modified":0.6428566774,"topic-classification_sid_recall_modified":0.6633522535,"topic-classification_sid_fscore_modified":0.628605048,"topic-classification_sid_acc":0.748,"topic-classification_sid_precision":0.6428566774,"topic-classification_sid_recall":0.6633522535,"topic-classification_sid_fscore":0.628605048,"topic-classification_sid_valid_output_ratio":1.0,"nlu_score":0.6758278127}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","topic-classification_sid_acc_modified":null,"topic-classification_sid_precision_modified":null,"topic-classification_sid_recall_modified":null,"topic-classification_sid_fscore_modified":null,"topic-classification_sid_acc":null,"topic-classification_sid_precision":null,"topic-classification_sid_recall":null,"topic-classification_sid_fscore":null,"topic-classification_sid_valid_output_ratio":null,"nlu_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.702,"topic-classification_sid_precision_modified":0.6070538637,"topic-classification_sid_recall_modified":0.5902772191,"topic-classification_sid_fscore_modified":0.5805725473,"topic-classification_sid_acc":0.7076612903,"topic-classification_sid_precision":0.6119494594,"topic-classification_sid_recall":0.5950375192,"topic-classification_sid_fscore":0.585254584,"topic-classification_sid_valid_output_ratio":0.992,"nlu_score":0.6898261633}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.636,"topic-classification_sid_precision_modified":0.6248180645,"topic-classification_sid_recall_modified":0.5200071748,"topic-classification_sid_fscore_modified":0.5212205085,"topic-classification_sid_acc":0.636,"topic-classification_sid_precision":0.6248180645,"topic-classification_sid_recall":0.5200071748,"topic-classification_sid_fscore":0.5212205085,"topic-classification_sid_valid_output_ratio":1.0,"nlu_score":0.6460328733}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.742,"topic-classification_sid_precision_modified":0.6167254178,"topic-classification_sid_recall_modified":0.6125584783,"topic-classification_sid_fscore_modified":0.5990165281,"topic-classification_sid_acc":0.7449799197,"topic-classification_sid_precision":0.6192022267,"topic-classification_sid_recall":0.6150185525,"topic-classification_sid_fscore":0.6014222169,"topic-classification_sid_valid_output_ratio":0.996,"nlu_score":0.6714091535}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.62,"topic-classification_sid_precision_modified":0.5570257373,"topic-classification_sid_recall_modified":0.5619595288,"topic-classification_sid_fscore_modified":0.5217673603,"topic-classification_sid_acc":0.6540084388,"topic-classification_sid_precision":0.5875798917,"topic-classification_sid_recall":0.5927843131,"topic-classification_sid_fscore":0.5503875108,"topic-classification_sid_valid_output_ratio":0.948,"nlu_score":0.4086928082}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","topic-classification_sid_acc_modified":0.75,"topic-classification_sid_precision_modified":0.6327306402,"topic-classification_sid_recall_modified":0.6347455045,"topic-classification_sid_fscore_modified":0.6231971632,"topic-classification_sid_acc":0.75,"topic-classification_sid_precision":0.6327306402,"topic-classification_sid_recall":0.6347455045,"topic-classification_sid_fscore":0.6231971632,"topic-classification_sid_valid_output_ratio":1.0,"nlu_score":0.3749414991}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.656,"topic-classification_sid_precision_modified":0.5819241823,"topic-classification_sid_recall_modified":0.5649560499,"topic-classification_sid_fscore_modified":0.5472284688,"topic-classification_sid_acc":0.7038626609,"topic-classification_sid_precision":0.6243821699,"topic-classification_sid_recall":0.6061760192,"topic-classification_sid_fscore":0.5871550095,"topic-classification_sid_valid_output_ratio":0.932,"nlu_score":0.5661558794}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","topic-classification_sid_acc_modified":0.664,"topic-classification_sid_precision_modified":0.5946530353,"topic-classification_sid_recall_modified":0.5719701311,"topic-classification_sid_fscore_modified":0.5732259537,"topic-classification_sid_acc":0.6720647773,"topic-classification_sid_precision":0.6018755418,"topic-classification_sid_recall":0.5789171368,"topic-classification_sid_fscore":0.5801882122,"topic-classification_sid_valid_output_ratio":0.988,"nlu_score":0.456845738}
         | 
    	
        leaderboard/boards_data/translation-ar2fa_ar2fa.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-ar2fa_ar2fa_bleu":0.1471879954,"translation-ar2fa_ar2fa_sahife_bleu":0.1294214814,"translation-ar2fa_ar2fa_nahj_bleu":0.0642841927,"translation-ar2fa_ar2fa_quran_bleu":0.2437131219,"nlg_score":0.1779340777}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0186923531,"translation-ar2fa_ar2fa_sahife_bleu":0.0174521967,"translation-ar2fa_ar2fa_nahj_bleu":0.0097734226,"translation-ar2fa_ar2fa_quran_bleu":0.0284054936,"nlg_score":0.0949943578}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.1414109272,"translation-ar2fa_ar2fa_sahife_bleu":0.136408042,"translation-ar2fa_ar2fa_nahj_bleu":0.0653197648,"translation-ar2fa_ar2fa_quran_bleu":0.2187004167,"nlg_score":0.1880477876}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0226935201,"translation-ar2fa_ar2fa_sahife_bleu":0.0196359142,"translation-ar2fa_ar2fa_nahj_bleu":0.010693835,"translation-ar2fa_ar2fa_quran_bleu":0.0371508269,"nlg_score":0.0940241349}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-ar2fa_ar2fa_bleu":0.1534130086,"translation-ar2fa_ar2fa_sahife_bleu":0.1250461134,"translation-ar2fa_ar2fa_nahj_bleu":0.0624466634,"translation-ar2fa_ar2fa_quran_bleu":0.2681979318,"nlg_score":0.194675133}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-ar2fa_ar2fa_bleu":null,"translation-ar2fa_ar2fa_sahife_bleu":null,"translation-ar2fa_ar2fa_nahj_bleu":null,"translation-ar2fa_ar2fa_quran_bleu":null,"nlg_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0465792583,"translation-ar2fa_ar2fa_sahife_bleu":0.023795336,"translation-ar2fa_ar2fa_nahj_bleu":0.0121091058,"translation-ar2fa_ar2fa_quran_bleu":0.1021098256,"nlg_score":0.1067134448}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0910450298,"translation-ar2fa_ar2fa_sahife_bleu":0.0862679894,"translation-ar2fa_ar2fa_nahj_bleu":0.0558129824,"translation-ar2fa_ar2fa_quran_bleu":0.1292925153,"nlg_score":0.16056333}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0985860814,"translation-ar2fa_ar2fa_sahife_bleu":0.0857687109,"translation-ar2fa_ar2fa_nahj_bleu":0.0622600203,"translation-ar2fa_ar2fa_quran_bleu":0.1459132099,"nlg_score":0.1679338638}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-ar2fa_ar2fa_bleu":0.0581992714,"translation-ar2fa_ar2fa_sahife_bleu":0.0540221076,"translation-ar2fa_ar2fa_nahj_bleu":0.0233017704,"translation-ar2fa_ar2fa_quran_bleu":0.095529061,"nlg_score":0.1089333827}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0594554675,"translation-ar2fa_ar2fa_sahife_bleu":0.0539986603,"translation-ar2fa_ar2fa_nahj_bleu":0.035240584,"translation-ar2fa_ar2fa_quran_bleu":0.0879164142,"nlg_score":0.1319091735}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0439654732,"translation-ar2fa_ar2fa_sahife_bleu":0.0313283708,"translation-ar2fa_ar2fa_nahj_bleu":0.0308641232,"translation-ar2fa_ar2fa_quran_bleu":0.0690488581,"nlg_score":0.112015688}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-ar2fa_ar2fa_bleu":0.1471879954,"translation-ar2fa_ar2fa_sahife_bleu":0.1294214814,"translation-ar2fa_ar2fa_nahj_bleu":0.0642841927,"translation-ar2fa_ar2fa_quran_bleu":0.2437131219,"nlg_score":0.1779340777}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0704966071,"translation-ar2fa_ar2fa_sahife_bleu":0.0675578984,"translation-ar2fa_ar2fa_nahj_bleu":0.042116411,"translation-ar2fa_ar2fa_quran_bleu":0.1003965021,"nlg_score":0.1334687319}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0186923531,"translation-ar2fa_ar2fa_sahife_bleu":0.0174521967,"translation-ar2fa_ar2fa_nahj_bleu":0.0097734226,"translation-ar2fa_ar2fa_quran_bleu":0.0284054936,"nlg_score":0.0949943578}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.1414109272,"translation-ar2fa_ar2fa_sahife_bleu":0.136408042,"translation-ar2fa_ar2fa_nahj_bleu":0.0653197648,"translation-ar2fa_ar2fa_quran_bleu":0.2187004167,"nlg_score":0.1880477876}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-ar2fa_ar2fa_bleu":0.1334075162,"translation-ar2fa_ar2fa_sahife_bleu":0.1143867102,"translation-ar2fa_ar2fa_nahj_bleu":0.063272709,"translation-ar2fa_ar2fa_quran_bleu":0.2190563892,"nlg_score":0.181552926}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-ar2fa_ar2fa_bleu":0.1183647194,"translation-ar2fa_ar2fa_sahife_bleu":0.0905358622,"translation-ar2fa_ar2fa_nahj_bleu":0.0522591914,"translation-ar2fa_ar2fa_quran_bleu":0.2089938281,"nlg_score":0.1643361642}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0975905866,"translation-ar2fa_ar2fa_sahife_bleu":0.0824300354,"translation-ar2fa_ar2fa_nahj_bleu":0.0513812903,"translation-ar2fa_ar2fa_quran_bleu":0.1566499693,"nlg_score":0.1454089411}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0226935201,"translation-ar2fa_ar2fa_sahife_bleu":0.0196359142,"translation-ar2fa_ar2fa_nahj_bleu":0.010693835,"translation-ar2fa_ar2fa_quran_bleu":0.0371508269,"nlg_score":0.0940241349}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-ar2fa_ar2fa_bleu":0.1534130086,"translation-ar2fa_ar2fa_sahife_bleu":0.1250461134,"translation-ar2fa_ar2fa_nahj_bleu":0.0624466634,"translation-ar2fa_ar2fa_quran_bleu":0.2681979318,"nlg_score":0.194675133}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-ar2fa_ar2fa_bleu":null,"translation-ar2fa_ar2fa_sahife_bleu":null,"translation-ar2fa_ar2fa_nahj_bleu":null,"translation-ar2fa_ar2fa_quran_bleu":null,"nlg_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0465792583,"translation-ar2fa_ar2fa_sahife_bleu":0.023795336,"translation-ar2fa_ar2fa_nahj_bleu":0.0121091058,"translation-ar2fa_ar2fa_quran_bleu":0.1021098256,"nlg_score":0.1067134448}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0910450298,"translation-ar2fa_ar2fa_sahife_bleu":0.0862679894,"translation-ar2fa_ar2fa_nahj_bleu":0.0558129824,"translation-ar2fa_ar2fa_quran_bleu":0.1292925153,"nlg_score":0.16056333}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0985860814,"translation-ar2fa_ar2fa_sahife_bleu":0.0857687109,"translation-ar2fa_ar2fa_nahj_bleu":0.0622600203,"translation-ar2fa_ar2fa_quran_bleu":0.1459132099,"nlg_score":0.1679338638}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0997661237,"translation-ar2fa_ar2fa_sahife_bleu":0.0880416079,"translation-ar2fa_ar2fa_nahj_bleu":0.0425251453,"translation-ar2fa_ar2fa_quran_bleu":0.165869569,"nlg_score":0.1567965528}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-ar2fa_ar2fa_bleu":0.0581992714,"translation-ar2fa_ar2fa_sahife_bleu":0.0540221076,"translation-ar2fa_ar2fa_nahj_bleu":0.0233017704,"translation-ar2fa_ar2fa_quran_bleu":0.095529061,"nlg_score":0.1089333827}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0594554675,"translation-ar2fa_ar2fa_sahife_bleu":0.0539986603,"translation-ar2fa_ar2fa_nahj_bleu":0.035240584,"translation-ar2fa_ar2fa_quran_bleu":0.0879164142,"nlg_score":0.1319091735}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","translation-ar2fa_ar2fa_bleu":0.0439654732,"translation-ar2fa_ar2fa_sahife_bleu":0.0313283708,"translation-ar2fa_ar2fa_nahj_bleu":0.0308641232,"translation-ar2fa_ar2fa_quran_bleu":0.0690488581,"nlg_score":0.112015688}
         | 
    	
        leaderboard/boards_data/translation-en2fa_en2fa.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-en2fa_en2fa_bleu":0.1799534349,"translation-en2fa_en2fa_epoque_bleu":0.4004213933,"translation-en2fa_en2fa_mizan_bleu":0.1703393716,"translation-en2fa_en2fa_quran_bleu":0.1225698669,"translation-en2fa_en2fa_sahife_bleu":0.0832764011,"translation-en2fa_en2fa_nahj_bleu":0.0439108113,"translation-en2fa_en2fa_tep_bleu":0.0595417592,"nlg_score":0.1779340777}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.0366912467,"translation-en2fa_en2fa_epoque_bleu":0.0623359898,"translation-en2fa_en2fa_mizan_bleu":0.0442763597,"translation-en2fa_en2fa_quran_bleu":0.0309309044,"translation-en2fa_en2fa_sahife_bleu":0.0330663757,"translation-en2fa_en2fa_nahj_bleu":0.0124767847,"translation-en2fa_en2fa_tep_bleu":0.0116612774,"nlg_score":0.0949943578}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.2018158808,"translation-en2fa_en2fa_epoque_bleu":0.4332944681,"translation-en2fa_en2fa_mizan_bleu":0.1925182751,"translation-en2fa_en2fa_quran_bleu":0.1530925462,"translation-en2fa_en2fa_sahife_bleu":0.1026499453,"translation-en2fa_en2fa_nahj_bleu":0.051968827,"translation-en2fa_en2fa_tep_bleu":0.0708487287,"nlg_score":0.1880477876}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.0600629844,"translation-en2fa_en2fa_epoque_bleu":0.1538216141,"translation-en2fa_en2fa_mizan_bleu":0.0548001026,"translation-en2fa_en2fa_quran_bleu":0.0217436833,"translation-en2fa_en2fa_sahife_bleu":0.0205645274,"translation-en2fa_en2fa_nahj_bleu":0.0172427415,"translation-en2fa_en2fa_tep_bleu":0.0093260061,"nlg_score":0.0940241349}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-en2fa_en2fa_bleu":0.1974288311,"translation-en2fa_en2fa_epoque_bleu":0.4102902123,"translation-en2fa_en2fa_mizan_bleu":0.1898606624,"translation-en2fa_en2fa_quran_bleu":0.1638084791,"translation-en2fa_en2fa_sahife_bleu":0.1095493859,"translation-en2fa_en2fa_nahj_bleu":0.0487097316,"translation-en2fa_en2fa_tep_bleu":0.0737497745,"nlg_score":0.194675133}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-en2fa_en2fa_bleu":null,"translation-en2fa_en2fa_epoque_bleu":null,"translation-en2fa_en2fa_mizan_bleu":null,"translation-en2fa_en2fa_quran_bleu":null,"translation-en2fa_en2fa_sahife_bleu":null,"translation-en2fa_en2fa_nahj_bleu":null,"translation-en2fa_en2fa_tep_bleu":null,"nlg_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.0439502467,"translation-en2fa_en2fa_epoque_bleu":0.0932804064,"translation-en2fa_en2fa_mizan_bleu":0.0446467932,"translation-en2fa_en2fa_quran_bleu":0.0435800727,"translation-en2fa_en2fa_sahife_bleu":0.0197005921,"translation-en2fa_en2fa_nahj_bleu":0.0132822652,"translation-en2fa_en2fa_tep_bleu":0.0087342692,"nlg_score":0.1067134448}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.1535253787,"translation-en2fa_en2fa_epoque_bleu":0.3553678809,"translation-en2fa_en2fa_mizan_bleu":0.1285441922,"translation-en2fa_en2fa_quran_bleu":0.0857809616,"translation-en2fa_en2fa_sahife_bleu":0.0787025343,"translation-en2fa_en2fa_nahj_bleu":0.0404850935,"translation-en2fa_en2fa_tep_bleu":0.0586129062,"nlg_score":0.16056333}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.1623218856,"translation-en2fa_en2fa_epoque_bleu":0.3677879105,"translation-en2fa_en2fa_mizan_bleu":0.147599732,"translation-en2fa_en2fa_quran_bleu":0.0938457658,"translation-en2fa_en2fa_sahife_bleu":0.0698903005,"translation-en2fa_en2fa_nahj_bleu":0.0435129812,"translation-en2fa_en2fa_tep_bleu":0.0620337306,"nlg_score":0.1679338638}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-en2fa_en2fa_bleu":0.056370201,"translation-en2fa_en2fa_epoque_bleu":0.1154392548,"translation-en2fa_en2fa_mizan_bleu":0.0484324583,"translation-en2fa_en2fa_quran_bleu":0.0612465488,"translation-en2fa_en2fa_sahife_bleu":0.0466818991,"translation-en2fa_en2fa_nahj_bleu":0.0218444477,"translation-en2fa_en2fa_tep_bleu":0.0118186665,"nlg_score":0.1089333827}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.1458447378,"translation-en2fa_en2fa_epoque_bleu":0.3541508677,"translation-en2fa_en2fa_mizan_bleu":0.1259468635,"translation-en2fa_en2fa_quran_bleu":0.0887225632,"translation-en2fa_en2fa_sahife_bleu":0.0672732746,"translation-en2fa_en2fa_nahj_bleu":0.0407327793,"translation-en2fa_en2fa_tep_bleu":0.0293172873,"nlg_score":0.1319091735}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.111865825,"translation-en2fa_en2fa_epoque_bleu":0.2732051575,"translation-en2fa_en2fa_mizan_bleu":0.0868500698,"translation-en2fa_en2fa_quran_bleu":0.0529852068,"translation-en2fa_en2fa_sahife_bleu":0.0502293343,"translation-en2fa_en2fa_nahj_bleu":0.0322064942,"translation-en2fa_en2fa_tep_bleu":0.0404507778,"nlg_score":0.112015688}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-en2fa_en2fa_bleu":0.1799534349,"translation-en2fa_en2fa_epoque_bleu":0.4004213933,"translation-en2fa_en2fa_mizan_bleu":0.1703393716,"translation-en2fa_en2fa_quran_bleu":0.1225698669,"translation-en2fa_en2fa_sahife_bleu":0.0832764011,"translation-en2fa_en2fa_nahj_bleu":0.0439108113,"translation-en2fa_en2fa_tep_bleu":0.0595417592,"nlg_score":0.1779340777}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.1482164359,"translation-en2fa_en2fa_epoque_bleu":0.3332313032,"translation-en2fa_en2fa_mizan_bleu":0.1348649993,"translation-en2fa_en2fa_quran_bleu":0.0798910499,"translation-en2fa_en2fa_sahife_bleu":0.0724923326,"translation-en2fa_en2fa_nahj_bleu":0.0425031053,"translation-en2fa_en2fa_tep_bleu":0.0570157331,"nlg_score":0.1334687319}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.0366912467,"translation-en2fa_en2fa_epoque_bleu":0.0623359898,"translation-en2fa_en2fa_mizan_bleu":0.0442763597,"translation-en2fa_en2fa_quran_bleu":0.0309309044,"translation-en2fa_en2fa_sahife_bleu":0.0330663757,"translation-en2fa_en2fa_nahj_bleu":0.0124767847,"translation-en2fa_en2fa_tep_bleu":0.0116612774,"nlg_score":0.0949943578}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.2018158808,"translation-en2fa_en2fa_epoque_bleu":0.4332944681,"translation-en2fa_en2fa_mizan_bleu":0.1925182751,"translation-en2fa_en2fa_quran_bleu":0.1530925462,"translation-en2fa_en2fa_sahife_bleu":0.1026499453,"translation-en2fa_en2fa_nahj_bleu":0.051968827,"translation-en2fa_en2fa_tep_bleu":0.0708487287,"nlg_score":0.1880477876}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-en2fa_en2fa_bleu":0.1757431213,"translation-en2fa_en2fa_epoque_bleu":0.3745398253,"translation-en2fa_en2fa_mizan_bleu":0.1640890656,"translation-en2fa_en2fa_quran_bleu":0.1377843747,"translation-en2fa_en2fa_sahife_bleu":0.0895949257,"translation-en2fa_en2fa_nahj_bleu":0.0437585905,"translation-en2fa_en2fa_tep_bleu":0.0679088622,"nlg_score":0.181552926}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-en2fa_en2fa_bleu":0.1700971031,"translation-en2fa_en2fa_epoque_bleu":0.3619925896,"translation-en2fa_en2fa_mizan_bleu":0.1638764762,"translation-en2fa_en2fa_quran_bleu":0.1169026899,"translation-en2fa_en2fa_sahife_bleu":0.0785107337,"translation-en2fa_en2fa_nahj_bleu":0.0463016599,"translation-en2fa_en2fa_tep_bleu":0.0704424388,"nlg_score":0.1643361642}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.1608795131,"translation-en2fa_en2fa_epoque_bleu":0.3578688062,"translation-en2fa_en2fa_mizan_bleu":0.1485917499,"translation-en2fa_en2fa_quran_bleu":0.094218512,"translation-en2fa_en2fa_sahife_bleu":0.0778161632,"translation-en2fa_en2fa_nahj_bleu":0.0434765061,"translation-en2fa_en2fa_tep_bleu":0.0618688381,"nlg_score":0.1454089411}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.0600629844,"translation-en2fa_en2fa_epoque_bleu":0.1538216141,"translation-en2fa_en2fa_mizan_bleu":0.0548001026,"translation-en2fa_en2fa_quran_bleu":0.0217436833,"translation-en2fa_en2fa_sahife_bleu":0.0205645274,"translation-en2fa_en2fa_nahj_bleu":0.0172427415,"translation-en2fa_en2fa_tep_bleu":0.0093260061,"nlg_score":0.0940241349}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-en2fa_en2fa_bleu":0.1974288311,"translation-en2fa_en2fa_epoque_bleu":0.4102902123,"translation-en2fa_en2fa_mizan_bleu":0.1898606624,"translation-en2fa_en2fa_quran_bleu":0.1638084791,"translation-en2fa_en2fa_sahife_bleu":0.1095493859,"translation-en2fa_en2fa_nahj_bleu":0.0487097316,"translation-en2fa_en2fa_tep_bleu":0.0737497745,"nlg_score":0.194675133}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-en2fa_en2fa_bleu":null,"translation-en2fa_en2fa_epoque_bleu":null,"translation-en2fa_en2fa_mizan_bleu":null,"translation-en2fa_en2fa_quran_bleu":null,"translation-en2fa_en2fa_sahife_bleu":null,"translation-en2fa_en2fa_nahj_bleu":null,"translation-en2fa_en2fa_tep_bleu":null,"nlg_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.0439502467,"translation-en2fa_en2fa_epoque_bleu":0.0932804064,"translation-en2fa_en2fa_mizan_bleu":0.0446467932,"translation-en2fa_en2fa_quran_bleu":0.0435800727,"translation-en2fa_en2fa_sahife_bleu":0.0197005921,"translation-en2fa_en2fa_nahj_bleu":0.0132822652,"translation-en2fa_en2fa_tep_bleu":0.0087342692,"nlg_score":0.1067134448}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.1535253787,"translation-en2fa_en2fa_epoque_bleu":0.3553678809,"translation-en2fa_en2fa_mizan_bleu":0.1285441922,"translation-en2fa_en2fa_quran_bleu":0.0857809616,"translation-en2fa_en2fa_sahife_bleu":0.0787025343,"translation-en2fa_en2fa_nahj_bleu":0.0404850935,"translation-en2fa_en2fa_tep_bleu":0.0586129062,"nlg_score":0.16056333}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.1623218856,"translation-en2fa_en2fa_epoque_bleu":0.3677879105,"translation-en2fa_en2fa_mizan_bleu":0.147599732,"translation-en2fa_en2fa_quran_bleu":0.0938457658,"translation-en2fa_en2fa_sahife_bleu":0.0698903005,"translation-en2fa_en2fa_nahj_bleu":0.0435129812,"translation-en2fa_en2fa_tep_bleu":0.0620337306,"nlg_score":0.1679338638}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.1694667296,"translation-en2fa_en2fa_epoque_bleu":0.3980975238,"translation-en2fa_en2fa_mizan_bleu":0.1400810731,"translation-en2fa_en2fa_quran_bleu":0.1173019123,"translation-en2fa_en2fa_sahife_bleu":0.0758825134,"translation-en2fa_en2fa_nahj_bleu":0.0380397952,"translation-en2fa_en2fa_tep_bleu":0.05711699,"nlg_score":0.1567965528}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-en2fa_en2fa_bleu":0.056370201,"translation-en2fa_en2fa_epoque_bleu":0.1154392548,"translation-en2fa_en2fa_mizan_bleu":0.0484324583,"translation-en2fa_en2fa_quran_bleu":0.0612465488,"translation-en2fa_en2fa_sahife_bleu":0.0466818991,"translation-en2fa_en2fa_nahj_bleu":0.0218444477,"translation-en2fa_en2fa_tep_bleu":0.0118186665,"nlg_score":0.1089333827}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.1458447378,"translation-en2fa_en2fa_epoque_bleu":0.3541508677,"translation-en2fa_en2fa_mizan_bleu":0.1259468635,"translation-en2fa_en2fa_quran_bleu":0.0887225632,"translation-en2fa_en2fa_sahife_bleu":0.0672732746,"translation-en2fa_en2fa_nahj_bleu":0.0407327793,"translation-en2fa_en2fa_tep_bleu":0.0293172873,"nlg_score":0.1319091735}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","translation-en2fa_en2fa_bleu":0.111865825,"translation-en2fa_en2fa_epoque_bleu":0.2732051575,"translation-en2fa_en2fa_mizan_bleu":0.0868500698,"translation-en2fa_en2fa_quran_bleu":0.0529852068,"translation-en2fa_en2fa_sahife_bleu":0.0502293343,"translation-en2fa_en2fa_nahj_bleu":0.0322064942,"translation-en2fa_en2fa_tep_bleu":0.0404507778,"nlg_score":0.112015688}
         | 
    	
        leaderboard/boards_data/translation-fa2ar_fa2ar.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2ar_fa2ar_bleu":0.0761269879,"translation-fa2ar_fa2ar_nahj_bleu":0.0321440801,"translation-fa2ar_fa2ar_sahife_bleu":0.0613632957,"translation-fa2ar_fa2ar_quran_bleu":0.134873588,"nlg_score":0.1779340777}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0067928767,"translation-fa2ar_fa2ar_nahj_bleu":0.0056689454,"translation-fa2ar_fa2ar_sahife_bleu":0.009024465,"translation-fa2ar_fa2ar_quran_bleu":0.0056852198,"nlg_score":0.0949943578}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0922998074,"translation-fa2ar_fa2ar_nahj_bleu":0.0511154919,"translation-fa2ar_fa2ar_sahife_bleu":0.0589808221,"translation-fa2ar_fa2ar_quran_bleu":0.1668031083,"nlg_score":0.1880477876}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0086214593,"translation-fa2ar_fa2ar_nahj_bleu":0.006894051,"translation-fa2ar_fa2ar_sahife_bleu":0.009695506,"translation-fa2ar_fa2ar_quran_bleu":0.0092748209,"nlg_score":0.0940241349}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2ar_fa2ar_bleu":0.0827618418,"translation-fa2ar_fa2ar_nahj_bleu":0.038434531,"translation-fa2ar_fa2ar_sahife_bleu":0.0781455938,"translation-fa2ar_fa2ar_quran_bleu":0.1317054007,"nlg_score":0.194675133}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2ar_fa2ar_bleu":null,"translation-fa2ar_fa2ar_nahj_bleu":null,"translation-fa2ar_fa2ar_sahife_bleu":null,"translation-fa2ar_fa2ar_quran_bleu":null,"nlg_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0100630648,"translation-fa2ar_fa2ar_nahj_bleu":0.0071647909,"translation-fa2ar_fa2ar_sahife_bleu":0.0101185743,"translation-fa2ar_fa2ar_quran_bleu":0.0129058292,"nlg_score":0.1067134448}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0494411806,"translation-fa2ar_fa2ar_nahj_bleu":0.0369805868,"translation-fa2ar_fa2ar_sahife_bleu":0.0567654991,"translation-fa2ar_fa2ar_quran_bleu":0.0545774559,"nlg_score":0.16056333}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0507003531,"translation-fa2ar_fa2ar_nahj_bleu":0.0316047659,"translation-fa2ar_fa2ar_sahife_bleu":0.0534488007,"translation-fa2ar_fa2ar_quran_bleu":0.0670474926,"nlg_score":0.1679338638}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2ar_fa2ar_bleu":0.0331262129,"translation-fa2ar_fa2ar_nahj_bleu":0.0202107323,"translation-fa2ar_fa2ar_sahife_bleu":0.0280883311,"translation-fa2ar_fa2ar_quran_bleu":0.0510795752,"nlg_score":0.1089333827}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0192357288,"translation-fa2ar_fa2ar_nahj_bleu":0.0151369319,"translation-fa2ar_fa2ar_sahife_bleu":0.0245784397,"translation-fa2ar_fa2ar_quran_bleu":0.0179918148,"nlg_score":0.1319091735}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0058610145,"translation-fa2ar_fa2ar_nahj_bleu":0.0063998692,"translation-fa2ar_fa2ar_sahife_bleu":0.0068172489,"translation-fa2ar_fa2ar_quran_bleu":0.0043275898,"nlg_score":0.112015688}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2ar_fa2ar_bleu":0.0761269879,"translation-fa2ar_fa2ar_nahj_bleu":0.0321440801,"translation-fa2ar_fa2ar_sahife_bleu":0.0613632957,"translation-fa2ar_fa2ar_quran_bleu":0.134873588,"nlg_score":0.1779340777}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0287298887,"translation-fa2ar_fa2ar_nahj_bleu":0.025061663,"translation-fa2ar_fa2ar_sahife_bleu":0.0355711393,"translation-fa2ar_fa2ar_quran_bleu":0.0255568639,"nlg_score":0.1334687319}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0067928767,"translation-fa2ar_fa2ar_nahj_bleu":0.0056689454,"translation-fa2ar_fa2ar_sahife_bleu":0.009024465,"translation-fa2ar_fa2ar_quran_bleu":0.0056852198,"nlg_score":0.0949943578}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0922998074,"translation-fa2ar_fa2ar_nahj_bleu":0.0511154919,"translation-fa2ar_fa2ar_sahife_bleu":0.0589808221,"translation-fa2ar_fa2ar_quran_bleu":0.1668031083,"nlg_score":0.1880477876}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2ar_fa2ar_bleu":0.0720575119,"translation-fa2ar_fa2ar_nahj_bleu":0.037394526,"translation-fa2ar_fa2ar_sahife_bleu":0.0636064419,"translation-fa2ar_fa2ar_quran_bleu":0.1151715676,"nlg_score":0.181552926}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2ar_fa2ar_bleu":0.0564204856,"translation-fa2ar_fa2ar_nahj_bleu":0.0345882932,"translation-fa2ar_fa2ar_sahife_bleu":0.0554604649,"translation-fa2ar_fa2ar_quran_bleu":0.0792126988,"nlg_score":0.1643361642}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"120000000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0374749811,"translation-fa2ar_fa2ar_nahj_bleu":0.0275129836,"translation-fa2ar_fa2ar_sahife_bleu":0.0412173132,"translation-fa2ar_fa2ar_quran_bleu":0.0436946465,"nlg_score":0.1454089411}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0086214593,"translation-fa2ar_fa2ar_nahj_bleu":0.006894051,"translation-fa2ar_fa2ar_sahife_bleu":0.009695506,"translation-fa2ar_fa2ar_quran_bleu":0.0092748209,"nlg_score":0.0940241349}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2ar_fa2ar_bleu":0.0827618418,"translation-fa2ar_fa2ar_nahj_bleu":0.038434531,"translation-fa2ar_fa2ar_sahife_bleu":0.0781455938,"translation-fa2ar_fa2ar_quran_bleu":0.1317054007,"nlg_score":0.194675133}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2ar_fa2ar_bleu":null,"translation-fa2ar_fa2ar_nahj_bleu":null,"translation-fa2ar_fa2ar_sahife_bleu":null,"translation-fa2ar_fa2ar_quran_bleu":null,"nlg_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0100630648,"translation-fa2ar_fa2ar_nahj_bleu":0.0071647909,"translation-fa2ar_fa2ar_sahife_bleu":0.0101185743,"translation-fa2ar_fa2ar_quran_bleu":0.0129058292,"nlg_score":0.1067134448}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0494411806,"translation-fa2ar_fa2ar_nahj_bleu":0.0369805868,"translation-fa2ar_fa2ar_sahife_bleu":0.0567654991,"translation-fa2ar_fa2ar_quran_bleu":0.0545774559,"nlg_score":0.16056333}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0507003531,"translation-fa2ar_fa2ar_nahj_bleu":0.0316047659,"translation-fa2ar_fa2ar_sahife_bleu":0.0534488007,"translation-fa2ar_fa2ar_quran_bleu":0.0670474926,"nlg_score":0.1679338638}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0548753777,"translation-fa2ar_fa2ar_nahj_bleu":0.0318327001,"translation-fa2ar_fa2ar_sahife_bleu":0.0567893259,"translation-fa2ar_fa2ar_quran_bleu":0.076004107,"nlg_score":0.1567965528}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2ar_fa2ar_bleu":0.0331262129,"translation-fa2ar_fa2ar_nahj_bleu":0.0202107323,"translation-fa2ar_fa2ar_sahife_bleu":0.0280883311,"translation-fa2ar_fa2ar_quran_bleu":0.0510795752,"nlg_score":0.1089333827}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0192357288,"translation-fa2ar_fa2ar_nahj_bleu":0.0151369319,"translation-fa2ar_fa2ar_sahife_bleu":0.0245784397,"translation-fa2ar_fa2ar_quran_bleu":0.0179918148,"nlg_score":0.1319091735}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","translation-fa2ar_fa2ar_bleu":0.0058610145,"translation-fa2ar_fa2ar_nahj_bleu":0.0063998692,"translation-fa2ar_fa2ar_sahife_bleu":0.0068172489,"translation-fa2ar_fa2ar_quran_bleu":0.0043275898,"nlg_score":0.112015688}
         | 
    	
        leaderboard/boards_data/translation-fa2en_fa2en.jsonl
    CHANGED
    
    | @@ -1,6 +1,10 @@ | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2en_fa2en_bleu":0.2247897554,"translation-fa2en_fa2en_tep_bleu":0.1341840946,"translation-fa2en_fa2en_mizan_bleu":0.1909021288,"translation-fa2en_fa2en_quran_bleu":0.1740971535,"translation-fa2en_fa2en_epoque_bleu":0.4544315204,"translation-fa2en_fa2en_nahj_bleu":0.0877235615,"translation-fa2en_fa2en_sahife_bleu":0.0975791022,"nlg_score":0.1779340777}
         | 
|  | |
| 2 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.016856047,"translation-fa2en_fa2en_tep_bleu":0.0085125001,"translation-fa2en_fa2en_mizan_bleu":0.013661635,"translation-fa2en_fa2en_quran_bleu":0.0181666202,"translation-fa2en_fa2en_epoque_bleu":0.0301282339,"translation-fa2en_fa2en_nahj_bleu":0.0122360126,"translation-fa2en_fa2en_sahife_bleu":0.0110323989,"nlg_score":0.0949943578}
         | 
| 3 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.2337569687,"translation-fa2en_fa2en_tep_bleu":0.1386371644,"translation-fa2en_fa2en_mizan_bleu":0.2129637469,"translation-fa2en_fa2en_quran_bleu":0.1702102457,"translation-fa2en_fa2en_epoque_bleu":0.478211182,"translation-fa2en_fa2en_nahj_bleu":0.083013513,"translation-fa2en_fa2en_sahife_bleu":0.072000292,"nlg_score":0.1880477876}
         | 
|  | |
|  | |
|  | |
| 4 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.0196181945,"translation-fa2en_fa2en_tep_bleu":0.0101636027,"translation-fa2en_fa2en_mizan_bleu":0.0153753718,"translation-fa2en_fa2en_quran_bleu":0.0231110679,"translation-fa2en_fa2en_epoque_bleu":0.0359429205,"translation-fa2en_fa2en_nahj_bleu":0.0119451943,"translation-fa2en_fa2en_sahife_bleu":0.0117936527,"nlg_score":0.0940241349}
         | 
| 5 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2en_fa2en_bleu":0.2307102128,"translation-fa2en_fa2en_tep_bleu":0.1527807458,"translation-fa2en_fa2en_mizan_bleu":0.1927067243,"translation-fa2en_fa2en_quran_bleu":0.1628198329,"translation-fa2en_fa2en_epoque_bleu":0.4676472481,"translation-fa2en_fa2en_nahj_bleu":0.0810494281,"translation-fa2en_fa2en_sahife_bleu":0.1009417344,"nlg_score":0.194675133}
         | 
| 6 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2en_fa2en_bleu":null,"translation-fa2en_fa2en_tep_bleu":null,"translation-fa2en_fa2en_mizan_bleu":null,"translation-fa2en_fa2en_quran_bleu":null,"translation-fa2en_fa2en_epoque_bleu":null,"translation-fa2en_fa2en_nahj_bleu":null,"translation-fa2en_fa2en_sahife_bleu":null,"nlg_score":null}
         | 
| @@ -8,6 +12,7 @@ | |
| 8 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.0199585579,"translation-fa2en_fa2en_tep_bleu":0.0097804397,"translation-fa2en_fa2en_mizan_bleu":0.0144809896,"translation-fa2en_fa2en_quran_bleu":0.0259691427,"translation-fa2en_fa2en_epoque_bleu":0.0345304173,"translation-fa2en_fa2en_nahj_bleu":0.0150589625,"translation-fa2en_fa2en_sahife_bleu":0.0157047184,"nlg_score":0.1067134448}
         | 
| 9 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.2145488085,"translation-fa2en_fa2en_tep_bleu":0.1307272464,"translation-fa2en_fa2en_mizan_bleu":0.1697754862,"translation-fa2en_fa2en_quran_bleu":0.1552415558,"translation-fa2en_fa2en_epoque_bleu":0.4513682579,"translation-fa2en_fa2en_nahj_bleu":0.0842673472,"translation-fa2en_fa2en_sahife_bleu":0.0853787118,"nlg_score":0.16056333}
         | 
| 10 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.217991447,"translation-fa2en_fa2en_tep_bleu":0.1271542443,"translation-fa2en_fa2en_mizan_bleu":0.1728081337,"translation-fa2en_fa2en_quran_bleu":0.158860515,"translation-fa2en_fa2en_epoque_bleu":0.4572670962,"translation-fa2en_fa2en_nahj_bleu":0.0902445729,"translation-fa2en_fa2en_sahife_bleu":0.0945000287,"nlg_score":0.1679338638}
         | 
|  | |
| 11 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2en_fa2en_bleu":0.0691353117,"translation-fa2en_fa2en_tep_bleu":0.0320908261,"translation-fa2en_fa2en_mizan_bleu":0.0535229905,"translation-fa2en_fa2en_quran_bleu":0.0800143919,"translation-fa2en_fa2en_epoque_bleu":0.133977443,"translation-fa2en_fa2en_nahj_bleu":0.0362958954,"translation-fa2en_fa2en_sahife_bleu":0.0393317574,"nlg_score":0.1089333827}
         | 
| 12 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.1451163884,"translation-fa2en_fa2en_tep_bleu":0.0393307601,"translation-fa2en_fa2en_mizan_bleu":0.1009347025,"translation-fa2en_fa2en_quran_bleu":0.0929688918,"translation-fa2en_fa2en_epoque_bleu":0.3660914464,"translation-fa2en_fa2en_nahj_bleu":0.0536507876,"translation-fa2en_fa2en_sahife_bleu":0.05038339,"nlg_score":0.1319091735}
         | 
| 13 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.1249013271,"translation-fa2en_fa2en_tep_bleu":0.0564543942,"translation-fa2en_fa2en_mizan_bleu":0.0739643668,"translation-fa2en_fa2en_quran_bleu":0.0677317381,"translation-fa2en_fa2en_epoque_bleu":0.3111968032,"translation-fa2en_fa2en_nahj_bleu":0.0523541092,"translation-fa2en_fa2en_sahife_bleu":0.0479821907,"nlg_score":0.112015688}
         | 
|  | |
| 1 | 
             
            {"Model Name":"claude-3-7-sonnet-20250219","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2en_fa2en_bleu":0.2247897554,"translation-fa2en_fa2en_tep_bleu":0.1341840946,"translation-fa2en_fa2en_mizan_bleu":0.1909021288,"translation-fa2en_fa2en_quran_bleu":0.1740971535,"translation-fa2en_fa2en_epoque_bleu":0.4544315204,"translation-fa2en_fa2en_nahj_bleu":0.0877235615,"translation-fa2en_fa2en_sahife_bleu":0.0975791022,"nlg_score":0.1779340777}
         | 
| 2 | 
            +
            {"Model Name":"gpt-oss:20b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"20000000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.1811060704,"translation-fa2en_fa2en_tep_bleu":0.1180786789,"translation-fa2en_fa2en_mizan_bleu":0.1503794353,"translation-fa2en_fa2en_quran_bleu":0.1042682142,"translation-fa2en_fa2en_epoque_bleu":0.3794274854,"translation-fa2en_fa2en_nahj_bleu":0.0641545233,"translation-fa2en_fa2en_sahife_bleu":0.0772362522,"nlg_score":0.1334687319}
         | 
| 3 | 
             
            {"Model Name":"gemma-3-4b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"4300000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.016856047,"translation-fa2en_fa2en_tep_bleu":0.0085125001,"translation-fa2en_fa2en_mizan_bleu":0.013661635,"translation-fa2en_fa2en_quran_bleu":0.0181666202,"translation-fa2en_fa2en_epoque_bleu":0.0301282339,"translation-fa2en_fa2en_nahj_bleu":0.0122360126,"translation-fa2en_fa2en_sahife_bleu":0.0110323989,"nlg_score":0.0949943578}
         | 
| 4 | 
             
            {"Model Name":"c4ai-command-r-plus","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"104000000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.2337569687,"translation-fa2en_fa2en_tep_bleu":0.1386371644,"translation-fa2en_fa2en_mizan_bleu":0.2129637469,"translation-fa2en_fa2en_quran_bleu":0.1702102457,"translation-fa2en_fa2en_epoque_bleu":0.478211182,"translation-fa2en_fa2en_nahj_bleu":0.083013513,"translation-fa2en_fa2en_sahife_bleu":0.072000292,"nlg_score":0.1880477876}
         | 
| 5 | 
            +
            {"Model Name":"gpt-5-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2en_fa2en_bleu":0.2435498156,"translation-fa2en_fa2en_tep_bleu":0.1656898075,"translation-fa2en_fa2en_mizan_bleu":0.2055420364,"translation-fa2en_fa2en_quran_bleu":0.1726910304,"translation-fa2en_fa2en_epoque_bleu":0.4912890145,"translation-fa2en_fa2en_nahj_bleu":0.0882784037,"translation-fa2en_fa2en_sahife_bleu":0.0952319793,"nlg_score":0.181552926}
         | 
| 6 | 
            +
            {"Model Name":"gpt-5-nano","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2en_fa2en_bleu":0.2293783795,"translation-fa2en_fa2en_tep_bleu":0.1348246647,"translation-fa2en_fa2en_mizan_bleu":0.1880942935,"translation-fa2en_fa2en_quran_bleu":0.1642751236,"translation-fa2en_fa2en_epoque_bleu":0.4821448205,"translation-fa2en_fa2en_nahj_bleu":0.0857659109,"translation-fa2en_fa2en_sahife_bleu":0.0914041173,"nlg_score":0.1643361642}
         | 
| 7 | 
            +
            {"Model Name":"gpt-oss:120b","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"120000000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.1889897396,"translation-fa2en_fa2en_tep_bleu":0.1330232097,"translation-fa2en_fa2en_mizan_bleu":0.1552418193,"translation-fa2en_fa2en_quran_bleu":0.1151586178,"translation-fa2en_fa2en_epoque_bleu":0.3895907069,"translation-fa2en_fa2en_nahj_bleu":0.0701778462,"translation-fa2en_fa2en_sahife_bleu":0.0722357071,"nlg_score":0.1454089411}
         | 
| 8 | 
             
            {"Model Name":"gemma-3n-E4B-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"7850000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.0196181945,"translation-fa2en_fa2en_tep_bleu":0.0101636027,"translation-fa2en_fa2en_mizan_bleu":0.0153753718,"translation-fa2en_fa2en_quran_bleu":0.0231110679,"translation-fa2en_fa2en_epoque_bleu":0.0359429205,"translation-fa2en_fa2en_nahj_bleu":0.0119451943,"translation-fa2en_fa2en_sahife_bleu":0.0117936527,"nlg_score":0.0940241349}
         | 
| 9 | 
             
            {"Model Name":"gpt-4.1","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2en_fa2en_bleu":0.2307102128,"translation-fa2en_fa2en_tep_bleu":0.1527807458,"translation-fa2en_fa2en_mizan_bleu":0.1927067243,"translation-fa2en_fa2en_quran_bleu":0.1628198329,"translation-fa2en_fa2en_epoque_bleu":0.4676472481,"translation-fa2en_fa2en_nahj_bleu":0.0810494281,"translation-fa2en_fa2en_sahife_bleu":0.1009417344,"nlg_score":0.194675133}
         | 
| 10 | 
             
            {"Model Name":"o4-mini","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2en_fa2en_bleu":null,"translation-fa2en_fa2en_tep_bleu":null,"translation-fa2en_fa2en_mizan_bleu":null,"translation-fa2en_fa2en_quran_bleu":null,"translation-fa2en_fa2en_epoque_bleu":null,"translation-fa2en_fa2en_nahj_bleu":null,"translation-fa2en_fa2en_sahife_bleu":null,"nlg_score":null}
         | 
|  | |
| 12 | 
             
            {"Model Name":"gemma-3-27b-it","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"27400000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.0199585579,"translation-fa2en_fa2en_tep_bleu":0.0097804397,"translation-fa2en_fa2en_mizan_bleu":0.0144809896,"translation-fa2en_fa2en_quran_bleu":0.0259691427,"translation-fa2en_fa2en_epoque_bleu":0.0345304173,"translation-fa2en_fa2en_nahj_bleu":0.0150589625,"translation-fa2en_fa2en_sahife_bleu":0.0157047184,"nlg_score":0.1067134448}
         | 
| 13 | 
             
            {"Model Name":"Qwen3-14B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"14800000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.2145488085,"translation-fa2en_fa2en_tep_bleu":0.1307272464,"translation-fa2en_fa2en_mizan_bleu":0.1697754862,"translation-fa2en_fa2en_quran_bleu":0.1552415558,"translation-fa2en_fa2en_epoque_bleu":0.4513682579,"translation-fa2en_fa2en_nahj_bleu":0.0842673472,"translation-fa2en_fa2en_sahife_bleu":0.0853787118,"nlg_score":0.16056333}
         | 
| 14 | 
             
            {"Model Name":"Qwen3-32B","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"32800000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.217991447,"translation-fa2en_fa2en_tep_bleu":0.1271542443,"translation-fa2en_fa2en_mizan_bleu":0.1728081337,"translation-fa2en_fa2en_quran_bleu":0.158860515,"translation-fa2en_fa2en_epoque_bleu":0.4572670962,"translation-fa2en_fa2en_nahj_bleu":0.0902445729,"translation-fa2en_fa2en_sahife_bleu":0.0945000287,"nlg_score":0.1679338638}
         | 
| 15 | 
            +
            {"Model Name":"llama4:scout","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"109000000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.1909462413,"translation-fa2en_fa2en_tep_bleu":0.1038996524,"translation-fa2en_fa2en_mizan_bleu":0.1513900262,"translation-fa2en_fa2en_quran_bleu":0.129609905,"translation-fa2en_fa2en_epoque_bleu":0.4266734606,"translation-fa2en_fa2en_nahj_bleu":0.0619630431,"translation-fa2en_fa2en_sahife_bleu":0.0584029483,"nlg_score":0.1567965528}
         | 
| 16 | 
             
            {"Model Name":"claude-3-5-haiku-20241022","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"None","source_type":"Closed-Source","translation-fa2en_fa2en_bleu":0.0691353117,"translation-fa2en_fa2en_tep_bleu":0.0320908261,"translation-fa2en_fa2en_mizan_bleu":0.0535229905,"translation-fa2en_fa2en_quran_bleu":0.0800143919,"translation-fa2en_fa2en_epoque_bleu":0.133977443,"translation-fa2en_fa2en_nahj_bleu":0.0362958954,"translation-fa2en_fa2en_sahife_bleu":0.0393317574,"nlg_score":0.1089333827}
         | 
| 17 | 
             
            {"Model Name":"Mistral-Small-3.1-24B-Instruct-2503","thinking_method":"β","model_url":"https:\/\/google.com","parameters_count":"24000000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.1451163884,"translation-fa2en_fa2en_tep_bleu":0.0393307601,"translation-fa2en_fa2en_mizan_bleu":0.1009347025,"translation-fa2en_fa2en_quran_bleu":0.0929688918,"translation-fa2en_fa2en_epoque_bleu":0.3660914464,"translation-fa2en_fa2en_nahj_bleu":0.0536507876,"translation-fa2en_fa2en_sahife_bleu":0.05038339,"nlg_score":0.1319091735}
         | 
| 18 | 
             
            {"Model Name":"DeepSeek-R1-0528-Qwen3-8B","thinking_method":"βοΈ","model_url":"https:\/\/google.com","parameters_count":"8190000000","source_type":"Open-Source","translation-fa2en_fa2en_bleu":0.1249013271,"translation-fa2en_fa2en_tep_bleu":0.0564543942,"translation-fa2en_fa2en_mizan_bleu":0.0739643668,"translation-fa2en_fa2en_quran_bleu":0.0677317381,"translation-fa2en_fa2en_epoque_bleu":0.3111968032,"translation-fa2en_fa2en_nahj_bleu":0.0523541092,"translation-fa2en_fa2en_sahife_bleu":0.0479821907,"nlg_score":0.112015688}
         | 
    	
        leaderboard/leaderboard_config.yaml
    CHANGED
    
    | @@ -241,6 +241,31 @@ model_display_configs: | |
| 241 | 
             
                url: "https://huggingface.co/deepseek-ai/DeepSeek-R1-0528-Qwen3-8B"
         | 
| 242 | 
             
                thinking: "βοΈ" # Sure
         | 
| 243 |  | 
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
| 244 | 
             
              # Add one entry for each model whose display name or URL you want to customize.
         | 
| 245 | 
             
              # If a model ID from your data is not listed here, its raw ID will be used as its name.
         | 
| 246 |  | 
|  | |
| 241 | 
             
                url: "https://huggingface.co/deepseek-ai/DeepSeek-R1-0528-Qwen3-8B"
         | 
| 242 | 
             
                thinking: "βοΈ" # Sure
         | 
| 243 |  | 
| 244 | 
            +
              "gpt-5-mini":
         | 
| 245 | 
            +
                display_name: "GPT-5 Mini"
         | 
| 246 | 
            +
                url: "https://openai.com/index/introducing-gpt-5/"
         | 
| 247 | 
            +
                thinking: "βοΈ"
         | 
| 248 | 
            +
             | 
| 249 | 
            +
              "gpt-5-nano":
         | 
| 250 | 
            +
                display_name: "GPT-5 Nano"
         | 
| 251 | 
            +
                url: "https://openai.com/index/introducing-gpt-5/"
         | 
| 252 | 
            +
                thinking: "βοΈ"
         | 
| 253 | 
            +
             | 
| 254 | 
            +
              "gpt-oss:120b":
         | 
| 255 | 
            +
                display_name: "GPT-OSS 120B"
         | 
| 256 | 
            +
                url: "https://openai.com/index/introducing-gpt-oss/"
         | 
| 257 | 
            +
                thinking: "βοΈ"
         | 
| 258 | 
            +
             | 
| 259 | 
            +
              "gpt-oss:20b":
         | 
| 260 | 
            +
                display_name: "GPT-OSS 20B"
         | 
| 261 | 
            +
                url: "https://openai.com/index/introducing-gpt-oss/"
         | 
| 262 | 
            +
                thinking: "βοΈ"
         | 
| 263 | 
            +
             | 
| 264 | 
            +
              "llama4:scout":
         | 
| 265 | 
            +
                display_name: "Llama 4 Scout"
         | 
| 266 | 
            +
                url: "https://ai.meta.com/blog/llama-4-multimodal-intelligence/"
         | 
| 267 | 
            +
                thinking: "β"
         | 
| 268 | 
            +
             | 
| 269 | 
             
              # Add one entry for each model whose display name or URL you want to customize.
         | 
| 270 | 
             
              # If a model ID from your data is not listed here, its raw ID will be used as its name.
         | 
| 271 |  | 
