# NEW-ASR-VOX
# ==============================================================================
# Cell 1: Complete Setup - Based on Your Working VoxLingua Code
# ==============================================================================
import os, re, glob, csv
import torch
import pandas as pd
import numpy as np
from sklearn.metrics import accuracy_score, confusion_matrix
from speechbrain.inference.classifiers import EncoderClassifier
from speechbrain.inference.interfaces import foreign_class  # modern path; speechbrain.pretrained.interfaces is deprecated
import torchaudio
import warnings
warnings.filterwarnings('ignore')

device = "cuda" if torch.cuda.is_available() else "cpu"
print(f"Using device: {device}")
# ==============================================================================
# Cell 2: Load Multiple Language Detection Models for Ensemble
# ==============================================================================
print("Loading Multiple Language Detection Models...")

# Model 1: VoxLingua107 ECAPA-TDNN (your working baseline - 60% ensemble weight, see Cell 5)
voxlingua_model = None
try:
    print("Loading VoxLingua107 ECAPA-TDNN...")
    voxlingua_model = EncoderClassifier.from_hparams(
        source="speechbrain/lang-id-voxlingua107-ecapa",
        savedir="pretrained_models/langid_voxlingua107_ecapa",
        run_opts={"device": device}
    )
    print("✓ VoxLingua107 loaded successfully")
except Exception as e:
    print(f"✗ VoxLingua107 failed: {e}")

# Model 2: XLS-R Language ID (40% ensemble weight, see Cell 5)
xlsr_lid_model = None
try:
    print("Loading TalTechNLP XLS-R Language ID...")
    xlsr_lid_model = foreign_class(
        source="TalTechNLP/voxlingua107-xls-r-300m-wav2vec",
        pymodule_file="encoder_wav2vec_classifier.py",
        classname="EncoderWav2vecClassifier",
        hparams_file="inference_wav2vec.yaml",
        savedir="pretrained_models/xlsr_voxlingua",
        run_opts={"device": device}
    )
    print("✓ XLS-R Language ID loaded successfully")
except Exception as e:
    print(f"✗ XLS-R failed: {e}")

models_loaded = sum(p is not None for p in [voxlingua_model, xlsr_lid_model])
print(f"\nModels loaded: {models_loaded}/2")
# ==============================================================================
# Cell 3: Complete Language Mappings from Your Dataset
# ==============================================================================
# All languages from your dataset (based on the accuracy table you showed)
DATASET_LANGUAGES = {
    # Indo-Aryan languages
    'ur', 'pa', 'hi', 'bn', 'ne', 'as', 'ks', 'mr', 'gu', 'or',
    # Dravidian languages
    'ta', 'te', 'kn', 'ml',
    # Low-resource languages
    'sd', 'kok', 'br', 'doi', 'sat', 'mni',
    # Others in your dataset
    'sa'  # Sanskrit
}

# Language family classifications
INDO_ARYAN_LANGS = {'ur', 'pa', 'hi', 'bn', 'ne', 'as', 'ks', 'mr', 'gu', 'or', 'sd'}
DRAVIDIAN_LANGS = {'ta', 'te', 'kn', 'ml'}
LOW_RESOURCE_LANGS = {'kok', 'br', 'doi', 'sat', 'mni'}
OTHER_LANGS = {'sa'}  # Sanskrit
ALL_SUPPORTED_LANGS = INDO_ARYAN_LANGS | DRAVIDIAN_LANGS | LOW_RESOURCE_LANGS | OTHER_LANGS

# Cross-lingual transfer mappings (research-based)
TRANSFER_MAPPINGS = {
    # Low-resource to high-resource language mappings
    'br': 'hi',   # Bodo -> Hindi (brx mapped to br in your dataset; caution: VoxLingua's own 'br' is Breton)
    'sat': 'hi',  # Santali -> Hindi
    'doi': 'pa',  # Dogri -> Punjabi
    'mni': 'bn',  # Manipuri -> Bengali
    'kok': 'mr',  # Konkani -> Marathi (geographic proximity)
    'sd': 'hi',   # Sindhi -> Hindi
}

# Language code mappings (VoxLingua output to your dataset codes)
VOXLINGUA_TO_DATASET = {
    'urd': 'ur', 'urdu': 'ur',
    'pan': 'pa', 'punjabi': 'pa', 'pnb': 'pa',
    'hin': 'hi', 'hindi': 'hi',
    'ben': 'bn', 'bengali': 'bn',
    'nep': 'ne', 'nepali': 'ne',
    'asm': 'as', 'assamese': 'as',
    'kas': 'ks', 'kashmiri': 'ks',
    'mar': 'mr', 'marathi': 'mr',
    'guj': 'gu', 'gujarati': 'gu',
    'ori': 'or', 'odia': 'or', 'ory': 'or',
    'tam': 'ta', 'tamil': 'ta',
    'tel': 'te', 'telugu': 'te',
    'kan': 'kn', 'kannada': 'kn',
    'mal': 'ml', 'malayalam': 'ml',
    'sin': 'sd', 'sindhi': 'sd', 'snd': 'sd',  # caution: ISO 639-3 'sin' is Sinhala, not Sindhi
    'kok': 'kok', 'konkani': 'kok',
    'san': 'sa', 'sanskrit': 'sa',
    # Common variations
    'bho': 'hi',  # Bhojpuri -> Hindi
    'mai': 'hi',  # Maithili -> Hindi
    'mag': 'hi',  # Magahi -> Hindi
}

print("✓ Complete language mappings loaded")
print(f"Total dataset languages: {len(ALL_SUPPORTED_LANGS)}")
print(f"Mapping variations: {len(VOXLINGUA_TO_DATASET)}")
# ==============================================================================
# Cell 4: Enhanced Parsing Functions (Your Working Code + Improvements)
# ==============================================================================
def parse_top1(out):
    """Parse VoxLingua107 output - your exact working function"""
    logits, log_conf, pred_idx, labels = out
    label_str = labels[0] if (isinstance(labels, (list, tuple)) and len(labels) > 0) else "unknown"
    if not isinstance(label_str, str):
        label_str = str(label_str)
    colon_pos = label_str.find(":")
    if colon_pos != -1:
        iso = label_str[:colon_pos].strip()
    else:
        iso = label_str.strip()
    conf = float(log_conf.exp().item())
    return iso, label_str, conf
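# --- Added usage example (not in the original cells): parse_top1 on a synthetic
# classify_file-style tuple (logits, log-confidence, predicted index, labels).
# The tensor values here are dummies chosen purely for illustration.
_demo_out = (torch.tensor([[0.1, 2.0]]),        # logits (unused by parse_top1)
             torch.log(torch.tensor(0.87)),     # log of the winning probability
             torch.tensor([1]),                 # predicted index (unused)
             ["hi: Hindi"])                     # top-1 text label
print(parse_top1(_demo_out))                    # -> ('hi', 'hi: Hindi', 0.87...)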
def parse_xlsr_output(out):
    """Parse XLS-R model output"""
    try:
        out_prob, score, index, text_lab = out
        lang_code = str(text_lab[0]).strip().lower()
        confidence = float(out_prob.exp().max().item())
        return lang_code, confidence
    except Exception as e:
        print(f"  XLS-R parsing error: {e}")
        return "unknown", 0.0

def map_to_dataset_language(detected_lang):
    """Map VoxLingua/XLS-R output to your dataset language codes"""
    # Direct match first
    if detected_lang in ALL_SUPPORTED_LANGS:
        return detected_lang
    # Check mapping dictionary
    mapped = VOXLINGUA_TO_DATASET.get(detected_lang.lower(), detected_lang)
    # If still not in dataset, try transfer mapping
    # NOTE: every current key in TRANSFER_MAPPINGS is already in ALL_SUPPORTED_LANGS,
    # so this branch is unreachable as written; it only fires for codes added to
    # TRANSFER_MAPPINGS without also being added to the dataset sets.
    if mapped not in ALL_SUPPORTED_LANGS and mapped in TRANSFER_MAPPINGS:
        transfer_target = TRANSFER_MAPPINGS[mapped]
        print(f"  Transfer mapping: {mapped} -> {transfer_target}")
        return transfer_target
    return mapped

print("✓ Enhanced parsing functions ready")
# ==============================================================================
# Cell 5: Hybrid Multi-Model Language Detection
# ==============================================================================
def hybrid_language_detection(audio_path):
    """
    Multi-model ensemble language detection optimized for your dataset
    """
    print(f"  Analyzing: {os.path.basename(audio_path)}")
    predictions = {}
    confidences = {}

    # Model 1: VoxLingua107 (primary - 60% weight, since it's your working baseline)
    if voxlingua_model is not None:
        try:
            out = voxlingua_model.classify_file(audio_path)
            pred_iso, pred_label, conf = parse_top1(out)
            # Map to dataset language codes
            mapped_lang = map_to_dataset_language(pred_iso)
            predictions['voxlingua'] = mapped_lang
            confidences['voxlingua'] = conf * 0.60  # 60% weight
            print(f"    VoxLingua107: {pred_iso} -> {mapped_lang} ({conf:.3f})")
        except Exception as e:
            print(f"    VoxLingua107 error: {e}")

    # Model 2: XLS-R (secondary - 40% weight)
    if xlsr_lid_model is not None:
        try:
            out = xlsr_lid_model.classify_file(audio_path)
            lang_code, conf = parse_xlsr_output(out)
            # Map to dataset language codes
            mapped_lang = map_to_dataset_language(lang_code)
            predictions['xlsr'] = mapped_lang
            confidences['xlsr'] = conf * 0.40  # 40% weight
            print(f"    XLS-R: {lang_code} -> {mapped_lang} ({conf:.3f})")
        except Exception as e:
            print(f"    XLS-R error: {e}")

    # Ensemble decision making
    if not predictions:
        return "unknown", 0.0

    # Strategy 1: check for agreement between models
    if len(predictions) >= 2:
        pred_values = list(predictions.values())
        if pred_values[0] == pred_values[1]:  # models agree
            consensus_lang = pred_values[0]
            avg_confidence = sum(confidences.values()) / len(confidences)
            print(f"  Consensus: {consensus_lang} (confidence: {avg_confidence:.3f})")
            return consensus_lang, avg_confidence

    # Strategy 2: use highest weighted confidence
    if confidences:
        best_model = max(confidences.keys(), key=lambda k: confidences[k])
        best_lang = predictions[best_model]
        best_conf = confidences[best_model] / (0.60 if best_model == 'voxlingua' else 0.40)  # undo the weighting
        print(f"  Best model ({best_model}): {best_lang} (confidence: {best_conf:.3f})")
        return best_lang, best_conf

    return "unknown", 0.0

print("✓ Hybrid ensemble language detection ready")
# ==============================================================================
# Cell 6: Complete Ground Truth Extraction for Your Dataset
# ==============================================================================
def gt_from_filename(path):
    """Extract ground truth from filename - complete version for your dataset"""
    name = os.path.basename(path).lower()
    # Pattern 1: your working regex pattern (captures 2-4 letter tokens bounded by _ or -)
    GT_TOKEN = re.compile(r'(?:^|[_-])([a-z]{2,4})(?:[_-]|$)', re.IGNORECASE)
    m = GT_TOKEN.search(name)
    if m:
        code = m.group(1).lower()
        # Complete mapping based on your dataset structure
        # (full-name keys like "punjabi" are defensive: the regex above only
        # captures 2-4 letter tokens, so they matter only if you loosen it)
        filename_mappings = {
            # Your working mappings
            "guf": "gu", "mrt": "mr", "ml": "ml",
            # Additional mappings for your complete dataset
            "urd": "ur", "urdu": "ur",
            "pan": "pa", "punjabi": "pa", "pnb": "pa",
            "hin": "hi", "hindi": "hi",
            "ben": "bn", "bengali": "bn", "bng": "bn",
            "nep": "ne", "nepali": "ne",
            "asm": "as", "assamese": "as",
            "kas": "ks", "kashmiri": "ks",
            "mar": "mr", "marathi": "mr",
            "guj": "gu", "gujarati": "gu",
            "ori": "or", "odia": "or", "ory": "or",
            "tam": "ta", "tamil": "ta",
            "tel": "te", "telugu": "te",
            "kan": "kn", "kannada": "kn",
            "mal": "ml", "malayalam": "ml",
            "sin": "sd", "sindhi": "sd", "snd": "sd",
            "kok": "kok", "konkani": "kok",
            "bod": "br", "bodo": "br",  # Bodo variations
            "dog": "doi", "dogri": "doi",
            "sat": "sat", "santali": "sat",
            "mni": "mni", "manipuri": "mni",
            "san": "sa", "sanskrit": "sa",
        }
        mapped_code = filename_mappings.get(code, code)
        # Validate against your dataset languages
        if mapped_code in ALL_SUPPORTED_LANGS:
            return mapped_code
    # Pattern 2: check folder structure
    path_parts = path.split('/')
    for part in path_parts:
        part_lower = part.lower()
        if part_lower in ALL_SUPPORTED_LANGS:
            return part_lower
        # Check if it's a language-name folder
        for full_name, code in [('gujarati', 'gu'), ('marathi', 'mr'), ('hindi', 'hi'),
                                ('bengali', 'bn'), ('tamil', 'ta'), ('telugu', 'te'),
                                ('kannada', 'kn'), ('malayalam', 'ml'), ('punjabi', 'pa'),
                                ('urdu', 'ur'), ('assamese', 'as'), ('odia', 'or'),
                                ('nepali', 'ne'), ('kashmiri', 'ks'), ('sindhi', 'sd'),
                                ('konkani', 'kok'), ('bodo', 'br'), ('dogri', 'doi'),
                                ('santali', 'sat'), ('manipuri', 'mni'), ('sanskrit', 'sa')]:
            if full_name in part_lower:
                return code
    return None

print("✓ Complete ground truth extraction ready")
# ==============================================================================
# Cell 7: Google Drive Processing with Error Handling
# ==============================================================================
def download_and_process_drive_dataset():
    """Download and process with robust error handling"""
    print("Processing Google Drive dataset...")
    # Get sharing link
    share_link = input("Enter Google Drive sharing link: ").strip()
    if not share_link:
        print("✗ No link provided")
        return []

    # Extract file ID
    def extract_file_id(link):
        patterns = [r'/folders/([a-zA-Z0-9-_]+)', r'id=([a-zA-Z0-9-_]+)', r'/file/d/([a-zA-Z0-9-_]+)']
        for pattern in patterns:
            match = re.search(pattern, link)
            if match:
                return match.group(1)
        return None

    file_id = extract_file_id(share_link)
    if not file_id:
        print("✗ Could not extract file ID from sharing link")
        return []

    # Setup download directory
    download_dir = "/content/drive_dataset"
    if os.path.exists(download_dir):
        import shutil
        shutil.rmtree(download_dir)
    os.makedirs(download_dir, exist_ok=True)

    # Download with error handling
    try:
        import gdown
        print(f"Downloading from Google Drive (ID: {file_id})...")
        # NOTE: gdown caps folder downloads (50 files by default); pass
        # remaining_ok=True if the folder is larger and a partial pull is acceptable
        gdown.download_folder(f"https://drive.google.com/drive/folders/{file_id}",
                              output=download_dir, quiet=False, use_cookies=False)
        print("✓ Download completed successfully")
    except Exception as e:
        print(f"✗ Download failed: {e}")
        print("Make sure the folder is shared with 'Anyone with the link can view'")
        return []

    # Scan for audio files
    VALID_EXTS = {".wav", ".mp3", ".flac", ".m4a", ".ogg"}
    def is_audio(filepath):
        return os.path.splitext(filepath)[1].lower() in VALID_EXTS

    print("Scanning for audio files...")
    all_files = []
    for root, dirs, files in os.walk(download_dir):
        for file in files:
            if is_audio(file):
                full_path = os.path.join(root, file)
                all_files.append(full_path)
    print(f"Found {len(all_files)} total audio files")

    # Filter and limit files
    filtered_files = []
    lang_counts = {}
    english_skipped = 0
    for file_path in all_files:
        # Skip English files
        if any(eng_indicator in file_path.lower() for eng_indicator in
               ['english', '_en_', '/en/', 'eng_', '_eng']):
            english_skipped += 1
            continue
        # Extract language for limiting
        gt_lang = gt_from_filename(file_path)
        if gt_lang:
            count = lang_counts.get(gt_lang, 0)
            if count < 5:  # max 5 files per language
                filtered_files.append(file_path)
                lang_counts[gt_lang] = count + 1
        else:
            # Include files without clear language markers (up to an overall limit)
            if len(filtered_files) < 50:
                filtered_files.append(file_path)

    print("Filtered results:")
    print(f"  English files skipped: {english_skipped}")
    print(f"  Selected for processing: {len(filtered_files)}")
    for lang, count in sorted(lang_counts.items()):
        print(f"  {lang}: {count} files")
    return filtered_files

# Execute download and processing
test_files = download_and_process_drive_dataset()
print(f"\nTotal files ready for language detection: {len(test_files)}")
# ==============================================================================
# Cell 8: Execute Language Detection Analysis
# ==============================================================================
def run_language_detection_analysis(audio_files):
    """Run complete language detection analysis"""
    if not audio_files:
        print("✗ No audio files to process")
        return []  # return an empty list so callers can take len() safely
    print(f"Starting language detection on {len(audio_files)} files...")
    print("=" * 60)
    results = []
    for i, audio_path in enumerate(audio_files, 1):
        print(f"\n[{i}/{len(audio_files)}] Processing: {os.path.basename(audio_path)}")
        try:
            # Extract ground truth
            gt_iso = gt_from_filename(audio_path)
            # Run hybrid detection
            pred_iso, confidence = hybrid_language_detection(audio_path)
            # Determine correctness
            is_correct = (gt_iso == pred_iso) if gt_iso else None
            result = {
                "file": os.path.basename(audio_path),
                "full_path": audio_path,
                "gt_iso": gt_iso if gt_iso else "",
                "pred_iso": pred_iso,
                "confidence": confidence,
                "correct": is_correct
            }
            results.append(result)
            # Status display
            status = "✓" if is_correct else "✗" if is_correct is False else "?"
            print(f"  {status} GT: {gt_iso or 'Unknown'} | Pred: {pred_iso} | Conf: {confidence:.3f}")
        except Exception as e:
            print(f"  Error processing file: {e}")
            results.append({
                "file": os.path.basename(audio_path),
                "full_path": audio_path,
                "gt_iso": "",
                "pred_iso": "error",
                "confidence": 0.0,
                "correct": False
            })
    return results

# Run the analysis
analysis_results = run_language_detection_analysis(test_files)
print("\nLanguage detection analysis complete!")
print(f"Total results: {len(analysis_results)}")
# ==============================================================================
# Cell 9: Complete Results Analysis and Accuracy Report
# ==============================================================================
def generate_comprehensive_analysis(results):
    """Generate complete analysis matching your dataset format"""
    df = pd.DataFrame(results)
    # Filter to files with ground truth from your dataset
    valid_df = df[(df["gt_iso"] != "") & (df["gt_iso"].isin(ALL_SUPPORTED_LANGS))].copy()
    if len(valid_df) == 0:
        print("✗ No valid ground truth files found")
        return None, None  # keep the two-value signature so callers can unpack
    print("COMPREHENSIVE LANGUAGE DETECTION ANALYSIS")
    print("=" * 60)
    # Overall accuracy
    overall_acc = accuracy_score(valid_df["gt_iso"], valid_df["pred_iso"])
    print(f"OVERALL ACCURACY: {overall_acc:.4f} ({overall_acc*100:.1f}%)")
    # Create accuracy table matching your format
    print("\nLANGUAGE-WISE ACCURACY:")
    print("-" * 60)
    print("Code | Language Name   | Files | Top-1 | Top-5 | Conf")
    print("-" * 60)
    # Language name mapping
    LANG_NAMES = {
        'ur': 'Urdu', 'pa': 'Punjabi', 'ta': 'Tamil', 'sd': 'Sindhi',
        'or': 'Odia', 'ml': 'Malayalam', 'ne': 'Nepali', 'as': 'Assamese',
        'hi': 'Hindi', 'bn': 'Bengali', 'kok': 'Konkani', 'kn': 'Kannada',
        'ks': 'Kashmiri', 'mr': 'Marathi', 'te': 'Telugu', 'br': 'Bodo',
        'doi': 'Dogri', 'sat': 'Santali', 'gu': 'Gujarati', 'mai': 'Maithili',
        'mni': 'Manipuri', 'sa': 'Sanskrit'
    }
    # Calculate per-language statistics
    lang_stats = []
    for lang_code in sorted(valid_df["gt_iso"].unique()):
        lang_data = valid_df[valid_df["gt_iso"] == lang_code]
        total_files = len(lang_data)
        correct_pred = (lang_data["gt_iso"] == lang_data["pred_iso"]).sum()
        accuracy = correct_pred / total_files
        avg_conf = lang_data["confidence"].mean()
        lang_name = LANG_NAMES.get(lang_code, lang_code.title())
        # Format output to match your table. The hybrid pipeline keeps only a
        # top-1 prediction, so the Top-5 column simply repeats Top-1 here; the
        # independent analysis below reports real Top-5 numbers.
        print(f"{lang_code:>3s} | {lang_name:<15s} | {total_files:>5d} | {accuracy*100:>5.1f}% | {accuracy*100:>5.1f}% | {avg_conf:>5.3f}")
        lang_stats.append({
            'code': lang_code,
            'name': lang_name,
            'files': total_files,
            'accuracy': accuracy,
            'confidence': avg_conf
        })
    print("-" * 60)

    # Language family analysis
    print("\nLANGUAGE FAMILY PERFORMANCE:")
    print("-" * 40)
    family_stats = {}
    for _, row in valid_df.iterrows():
        lang = row['gt_iso']
        correct = row['correct']
        if lang in INDO_ARYAN_LANGS:
            family = 'Indo-Aryan'
        elif lang in DRAVIDIAN_LANGS:
            family = 'Dravidian'
        elif lang in LOW_RESOURCE_LANGS:
            family = 'Low-Resource'
        else:
            family = 'Other'
        if family not in family_stats:
            family_stats[family] = {'correct': 0, 'total': 0}
        family_stats[family]['total'] += 1
        if correct:
            family_stats[family]['correct'] += 1
    for family, stats in family_stats.items():
        acc_pct = (stats['correct'] / stats['total']) * 100
        print(f"{family:<15s}: {acc_pct:>5.1f}% ({stats['correct']:>2d}/{stats['total']:>2d})")

    # Model performance analysis
    print("\nMODEL PERFORMANCE:")
    print("-" * 30)
    print(f"Models loaded: {models_loaded}/2")
    print(f"VoxLingua107: {'Active' if voxlingua_model else 'Failed'}")
    print(f"XLS-R: {'Active' if xlsr_lid_model else 'Failed'}")

    # Error analysis
    errors = valid_df[valid_df["gt_iso"] != valid_df["pred_iso"]]
    if len(errors) > 0:
        print(f"\nMISCLASSIFICATION ANALYSIS ({len(errors)} errors):")
        print("-" * 50)
        # Group errors by actual language
        for actual_lang in sorted(errors["gt_iso"].unique()):
            lang_errors = errors[errors["gt_iso"] == actual_lang]
            predicted_langs = lang_errors["pred_iso"].value_counts()
            print(f"{actual_lang} ({LANG_NAMES.get(actual_lang, actual_lang)}):")
            for pred_lang, count in predicted_langs.head(3).items():
                print(f"  -> {pred_lang} ({count} files)")

    # Summary statistics
    print("\nSUMMARY STATISTICS:")
    print("-" * 25)
    print(f"Total files processed: {len(df)}")
    print(f"Files with valid GT: {len(valid_df)}")
    print(f"Languages detected: {len(valid_df['pred_iso'].unique())}")
    print(f"Languages in dataset: {len(valid_df['gt_iso'].unique())}")
    print(f"Perfect accuracy: {len([l for l in lang_stats if l['accuracy'] == 1.0])}")
    print(f"Above 90% accuracy: {len([l for l in lang_stats if l['accuracy'] >= 0.9])}")
    print(f"Below 50% accuracy: {len([l for l in lang_stats if l['accuracy'] < 0.5])}")
    return valid_df, lang_stats

# Run comprehensive analysis
if 'analysis_results' in globals() and analysis_results:
    final_df, language_statistics = generate_comprehensive_analysis(analysis_results)
    # Save results to CSV
    if final_df is not None:
        timestamp = pd.Timestamp.now().strftime("%Y%m%d_%H%M%S")
        csv_filename = f"language_detection_results_{timestamp}.csv"
        final_df.to_csv(csv_filename, index=False)
        print(f"\nResults saved to: {csv_filename}")
        # Download the CSV when running in Colab
        try:
            from google.colab import files
            files.download(csv_filename)
            print("File downloaded successfully")
        except Exception:
            print("File saved locally (download failed)")
else:
    print("✗ No analysis results available. Please run the previous cells first.")
print("\n✓ COMPLETE LANGUAGE DETECTION ANALYSIS FINISHED!")
# ==============================================================================
# Independent Model Analysis with Top-5 and Real Confidence Scores
# ==============================================================================
def analyze_models_independently(audio_files):
    """Analyze each model independently with Top-5 predictions and real confidence scores"""
    print("INDEPENDENT MODEL ANALYSIS")
    print("=" * 60)
    results = {
        'voxlingua': [],
        'xlsr': [],
        'combined_analysis': []
    }
    for i, audio_path in enumerate(audio_files, 1):
        print(f"\n[{i}/{len(audio_files)}] Analyzing: {os.path.basename(audio_path)}")
        # Extract ground truth
        gt_iso = gt_from_filename(audio_path)
        print(f"  Ground Truth: {gt_iso or 'Unknown'}")
        file_result = {
            'file': os.path.basename(audio_path),
            'gt_iso': gt_iso or '',
            'voxlingua_results': {},
            'xlsr_results': {}
        }
        # ========================================
        # VoxLingua107 Independent Analysis
        # ========================================
        if voxlingua_model is not None:
            try:
                print("  VoxLingua107 Analysis:")
                out = voxlingua_model.classify_file(audio_path)
                # Extract Top-5 predictions with real confidence scores
                logits, log_conf, pred_idx, labels = out
                # Get top 5 predictions
                top5_indices = torch.topk(logits.squeeze(), 5).indices
                top5_probs = torch.softmax(logits.squeeze(), dim=0)
                vox_top5 = []
                for idx in top5_indices:
                    # CAUTION: classify_file returns only the winning text label(s),
                    # so indexing labels by class index usually falls through to
                    # the idx_ fallback; the FIXED analysis below addresses this.
                    lang_label = labels[idx.item()] if idx.item() < len(labels) else f"idx_{idx.item()}"
                    prob = top5_probs[idx.item()].item()
                    # Extract language code
                    if isinstance(lang_label, str):
                        colon_pos = lang_label.find(":")
                        lang_code = lang_label[:colon_pos].strip() if colon_pos != -1 else lang_label.strip()
                    else:
                        lang_code = str(lang_label)
                    # Map to dataset codes
                    mapped_lang = map_to_dataset_language(lang_code)
                    vox_top5.append({
                        'rank': len(vox_top5) + 1,
                        'original_code': lang_code,
                        'mapped_code': mapped_lang,
                        'confidence': prob,
                        'in_dataset': mapped_lang in ALL_SUPPORTED_LANGS
                    })
                    print(f"    Rank {len(vox_top5)}: {lang_code} -> {mapped_lang} ({prob:.4f}) {'✓' if mapped_lang in ALL_SUPPORTED_LANGS else '✗'}")
                # Store VoxLingua results
                file_result['voxlingua_results'] = {
                    'top5': vox_top5,
                    'top1_original': vox_top5[0]['original_code'],
                    'top1_mapped': vox_top5[0]['mapped_code'],
                    'top1_confidence': vox_top5[0]['confidence'],
                    'correct_in_top1': gt_iso == vox_top5[0]['mapped_code'] if gt_iso else None,
                    'correct_in_top5': any(pred['mapped_code'] == gt_iso for pred in vox_top5) if gt_iso else None
                }
                results['voxlingua'].append({
                    'file': os.path.basename(audio_path),
                    'gt_iso': gt_iso or '',
                    'pred_iso': vox_top5[0]['mapped_code'],
                    'confidence': vox_top5[0]['confidence'],
                    'correct': gt_iso == vox_top5[0]['mapped_code'] if gt_iso else None,
                    'top5_predictions': [p['mapped_code'] for p in vox_top5]
                })
            except Exception as e:
                print(f"  ✗ VoxLingua107 error: {e}")
                file_result['voxlingua_results'] = {'error': str(e)}
        # ========================================
        # XLS-R Independent Analysis
        # ========================================
        if xlsr_lid_model is not None:
            try:
                print("  XLS-R Analysis:")
                out = xlsr_lid_model.classify_file(audio_path)
                # Parse XLS-R output for Top-5 (same caveat as above: text_lab may
                # only contain the winning label)
                out_prob, score, index, text_lab = out
                # Get top 5 predictions
                top5_indices = torch.topk(out_prob.squeeze(), 5).indices
                top5_probs = torch.softmax(out_prob.squeeze(), dim=0)
                xlsr_top5 = []
                for idx in top5_indices:
                    lang_label = text_lab[idx.item()] if idx.item() < len(text_lab) else f"idx_{idx.item()}"
                    prob = top5_probs[idx.item()].item()
                    lang_code = str(lang_label).strip().lower()
                    mapped_lang = map_to_dataset_language(lang_code)
                    xlsr_top5.append({
                        'rank': len(xlsr_top5) + 1,
                        'original_code': lang_code,
                        'mapped_code': mapped_lang,
                        'confidence': prob,
                        'in_dataset': mapped_lang in ALL_SUPPORTED_LANGS
                    })
                    print(f"    Rank {len(xlsr_top5)}: {lang_code} -> {mapped_lang} ({prob:.4f}) {'✓' if mapped_lang in ALL_SUPPORTED_LANGS else '✗'}")
                # Store XLS-R results
                file_result['xlsr_results'] = {
                    'top5': xlsr_top5,
                    'top1_original': xlsr_top5[0]['original_code'],
                    'top1_mapped': xlsr_top5[0]['mapped_code'],
                    'top1_confidence': xlsr_top5[0]['confidence'],
                    'correct_in_top1': gt_iso == xlsr_top5[0]['mapped_code'] if gt_iso else None,
                    'correct_in_top5': any(pred['mapped_code'] == gt_iso for pred in xlsr_top5) if gt_iso else None
                }
                results['xlsr'].append({
                    'file': os.path.basename(audio_path),
                    'gt_iso': gt_iso or '',
                    'pred_iso': xlsr_top5[0]['mapped_code'],
                    'confidence': xlsr_top5[0]['confidence'],
                    'correct': gt_iso == xlsr_top5[0]['mapped_code'] if gt_iso else None,
                    'top5_predictions': [p['mapped_code'] for p in xlsr_top5]
                })
            except Exception as e:
                print(f"  ✗ XLS-R error: {e}")
                file_result['xlsr_results'] = {'error': str(e)}
        results['combined_analysis'].append(file_result)
        print(f"  ✓ Analysis complete for {os.path.basename(audio_path)}")
    return results

def generate_independent_model_report(results):
    """Generate comprehensive independent model analysis report"""
    print("\nINDEPENDENT MODEL PERFORMANCE ANALYSIS")
    print("=" * 70)
    # VoxLingua107 analysis
    if results['voxlingua']:
        vox_df = pd.DataFrame(results['voxlingua'])
        valid_vox = vox_df[vox_df['gt_iso'] != ''].copy()
        if len(valid_vox) > 0:
            vox_acc = accuracy_score(valid_vox['gt_iso'], valid_vox['pred_iso'])
            vox_conf_avg = valid_vox['confidence'].mean()
            vox_conf_std = valid_vox['confidence'].std()
            print("\nVoxLingua107 INDEPENDENT ANALYSIS:")
            print(f"  Files analyzed: {len(valid_vox)}")
            print(f"  Top-1 Accuracy: {vox_acc:.4f} ({vox_acc*100:.1f}%)")
            print(f"  Avg Confidence: {vox_conf_avg:.4f} ± {vox_conf_std:.4f}")
            # Per-language accuracy for VoxLingua
            print("  Per-language performance:")
            vox_per_lang = valid_vox.groupby('gt_iso').agg({
                'correct': 'mean',
                'confidence': ['mean', 'count']
            }).round(4)
            vox_per_lang.columns = ['accuracy', 'avg_conf', 'count']
            for lang, row in vox_per_lang.iterrows():
                print(f"    {lang}: {row['accuracy']:.3f} ({row['accuracy']*100:.1f}%) - {row['avg_conf']:.3f} conf - {int(row['count'])} files")
    # XLS-R analysis
    if results['xlsr']:
        xlsr_df = pd.DataFrame(results['xlsr'])
        valid_xlsr = xlsr_df[xlsr_df['gt_iso'] != ''].copy()
        if len(valid_xlsr) > 0:
            xlsr_acc = accuracy_score(valid_xlsr['gt_iso'], valid_xlsr['pred_iso'])
            xlsr_conf_avg = valid_xlsr['confidence'].mean()
            xlsr_conf_std = valid_xlsr['confidence'].std()
            print("\nXLS-R INDEPENDENT ANALYSIS:")
            print(f"  Files analyzed: {len(valid_xlsr)}")
            print(f"  Top-1 Accuracy: {xlsr_acc:.4f} ({xlsr_acc*100:.1f}%)")
            print(f"  Avg Confidence: {xlsr_conf_avg:.4f} ± {xlsr_conf_std:.4f}")
            # Per-language accuracy for XLS-R
            print("  Per-language performance:")
            xlsr_per_lang = valid_xlsr.groupby('gt_iso').agg({
                'correct': 'mean',
                'confidence': ['mean', 'count']
            }).round(4)
            xlsr_per_lang.columns = ['accuracy', 'avg_conf', 'count']
            for lang, row in xlsr_per_lang.iterrows():
                print(f"    {lang}: {row['accuracy']:.3f} ({row['accuracy']*100:.1f}%) - {row['avg_conf']:.3f} conf - {int(row['count'])} files")
    # Model comparison (guarded: the accuracy/confidence variables above only
    # exist when both models produced rows with valid ground truth)
    if results['voxlingua'] and results['xlsr'] and len(valid_vox) > 0 and len(valid_xlsr) > 0:
        print("\nMODEL COMPARISON:")
        print("  VoxLingua107 vs XLS-R:")
        print(f"  Accuracy: {vox_acc:.4f} vs {xlsr_acc:.4f} ({'VoxLingua wins' if vox_acc > xlsr_acc else 'XLS-R wins' if xlsr_acc > vox_acc else 'Tie'})")
        print(f"  Avg Confidence: {vox_conf_avg:.4f} vs {xlsr_conf_avg:.4f}")
        # Suggest optimal weights
        total_perf = vox_acc + xlsr_acc
        vox_weight = vox_acc / total_perf if total_perf > 0 else 0.5
        xlsr_weight = xlsr_acc / total_perf if total_perf > 0 else 0.5
        print("\nSUGGESTED OPTIMAL WEIGHTS:")
        print(f"  VoxLingua107: {vox_weight:.2f} ({vox_weight*100:.0f}%)")
        print(f"  XLS-R: {xlsr_weight:.2f} ({xlsr_weight*100:.0f}%)")
    return results

# Run independent analysis
if 'test_files' in globals() and test_files:
    independent_results = analyze_models_independently(test_files[:10])  # limit to first 10 for testing
    final_report = generate_independent_model_report(independent_results)
else:
    print("✗ No test files available. Run the previous cells first.")
# ==============================================================================
# Analyze Already Downloaded Files in /content/drive_dataset/
# ==============================================================================
def scan_downloaded_files():
    """Scan and collect already downloaded audio files"""
    download_dir = "/content/drive_dataset"
    if not os.path.exists(download_dir):
        print("✗ Download directory not found")
        return []
    print(f"Scanning {download_dir} for audio files...")
    # Valid audio extensions
    VALID_EXTS = {".wav", ".mp3", ".flac", ".m4a", ".ogg"}
    def is_audio(filepath):
        return os.path.splitext(filepath)[1].lower() in VALID_EXTS
    # Collect all audio files
    audio_files = []
    lang_counts = {}
    for root, dirs, files in os.walk(download_dir):
        for file in files:
            if is_audio(file):
                full_path = os.path.join(root, file)
                audio_files.append(full_path)
                # Extract language from folder structure (first 2-3 letter alphabetic path part)
                path_parts = root.split('/')
                for part in path_parts:
                    if len(part) in [2, 3] and part.isalpha():
                        lang_counts[part] = lang_counts.get(part, 0) + 1
                        break
    print(f"Found {len(audio_files)} audio files:")
    for lang, count in sorted(lang_counts.items()):
        print(f"  {lang}: {count} files")
    # Show sample files
    print("\nSample files:")
    for file_path in audio_files[:5]:
        print(f"  {file_path}")
    return audio_files

# Scan for downloaded files
downloaded_files = scan_downloaded_files()
if not downloaded_files:
    print("✗ No audio files found. Let me help you collect them manually.")
    # Manual file collection if scan fails
    print("\nManual file search...")
    import glob
    # Search patterns for common locations
    search_patterns = [
        "/content/drive_dataset/**/*.flac",
        "/content/drive_dataset/**/*.wav",
        "/content/drive_dataset/**/*.mp3",
        "/content/**/*.flac",
        "/content/**/*.wav",
        "/content/**/*.mp3"
    ]
    manual_files = []
    for pattern in search_patterns:
        found = glob.glob(pattern, recursive=True)
        manual_files.extend(found)
    # Remove duplicates
    manual_files = list(set(manual_files))
    print(f"Manual search found: {len(manual_files)} files")
    for file_path in manual_files[:10]:  # show first 10
        print(f"  {file_path}")
    downloaded_files = manual_files

print(f"\nTotal files ready for analysis: {len(downloaded_files)}")
# ==============================================================================
# Run Independent Analysis on Downloaded Files
# ==============================================================================
def analyze_downloaded_files_independently(audio_files):
    """Run independent model analysis on downloaded files with detailed output"""
    if not audio_files:
        print("✗ No audio files to analyze")
        return None
    print(f"Starting independent analysis on {len(audio_files)} files...")
    print("=" * 70)
    results = {
        'voxlingua_detailed': [],
        'xlsr_detailed': [],
        'comparison_data': []
    }
    for i, audio_path in enumerate(audio_files, 1):
        print(f"\n[{i}/{len(audio_files)}] {os.path.basename(audio_path)}")
        # Extract ground truth from path/filename
        gt_iso = gt_from_filename(audio_path)
        print(f"  Ground Truth: {gt_iso or 'Unknown'}")
        file_analysis = {
            'file': os.path.basename(audio_path),
            'full_path': audio_path,
            'gt_iso': gt_iso or '',
            'voxlingua': {'available': False},
            'xlsr': {'available': False}
        }
        # ==========================================
        # VoxLingua107 Independent Analysis
        # ==========================================
        if voxlingua_model is not None:
            try:
                print("  VoxLingua107 Analysis:")
                out = voxlingua_model.classify_file(audio_path)
                logits, log_conf, pred_idx, labels = out
                # Get real confidence scores (not weighted)
                probs = torch.softmax(logits.squeeze(), dim=0)
                top5_indices = torch.topk(probs, min(5, len(probs))).indices
                vox_predictions = []
                for rank, idx in enumerate(top5_indices, 1):
                    lang_label = labels[idx.item()]
                    confidence = probs[idx.item()].item()
                    # Parse language code
                    if isinstance(lang_label, str):
                        colon_pos = lang_label.find(":")
                        lang_code = lang_label[:colon_pos].strip() if colon_pos != -1 else lang_label.strip()
                    else:
                        lang_code = str(lang_label)
                    # Map to dataset language
                    mapped_lang = map_to_dataset_language(lang_code)
                    vox_predictions.append({
                        'rank': rank,
                        'original': lang_code,
                        'mapped': mapped_lang,
                        'confidence': confidence,
                        'in_dataset': mapped_lang in ALL_SUPPORTED_LANGS
                    })
                    status = "✓" if mapped_lang in ALL_SUPPORTED_LANGS else "✗"
                    print(f"    #{rank}: {lang_code} -> {mapped_lang} ({confidence:.4f}) {status}")
                # Store VoxLingua results
                top1 = vox_predictions[0]
                file_analysis['voxlingua'] = {
                    'available': True,
                    'top5_predictions': vox_predictions,
                    'top1_prediction': top1['mapped'],
                    'top1_confidence': top1['confidence'],
                    'correct_top1': gt_iso == top1['mapped'] if gt_iso else None,
                    'correct_in_top5': any(p['mapped'] == gt_iso for p in vox_predictions) if gt_iso else None
                }
                results['voxlingua_detailed'].append({
                    'file': os.path.basename(audio_path),
                    'gt_iso': gt_iso or '',
                    'pred_iso': top1['mapped'],
                    'confidence': top1['confidence'],
                    'correct': gt_iso == top1['mapped'] if gt_iso else None
                })
            except Exception as e:
                print(f"  ✗ VoxLingua107 error: {e}")
                file_analysis['voxlingua'] = {'available': False, 'error': str(e)}
        # ==========================================
        # XLS-R Independent Analysis
        # ==========================================
        if xlsr_lid_model is not None:
            try:
                print("  XLS-R Analysis:")
                out = xlsr_lid_model.classify_file(audio_path)
                out_prob, score, index, text_lab = out
                # Get real confidence scores
                probs = torch.softmax(out_prob.squeeze(), dim=0)
                top5_indices = torch.topk(probs, min(5, len(probs))).indices
                xlsr_predictions = []
                for rank, idx in enumerate(top5_indices, 1):
                    lang_label = text_lab[idx.item()]
                    confidence = probs[idx.item()].item()
                    lang_code = str(lang_label).strip().lower()
                    mapped_lang = map_to_dataset_language(lang_code)
                    xlsr_predictions.append({
                        'rank': rank,
                        'original': lang_code,
                        'mapped': mapped_lang,
                        'confidence': confidence,
                        'in_dataset': mapped_lang in ALL_SUPPORTED_LANGS
                    })
                    status = "✓" if mapped_lang in ALL_SUPPORTED_LANGS else "✗"
                    print(f"    #{rank}: {lang_code} -> {mapped_lang} ({confidence:.4f}) {status}")
                # Store XLS-R results
                top1 = xlsr_predictions[0]
                file_analysis['xlsr'] = {
                    'available': True,
                    'top5_predictions': xlsr_predictions,
                    'top1_prediction': top1['mapped'],
                    'top1_confidence': top1['confidence'],
                    'correct_top1': gt_iso == top1['mapped'] if gt_iso else None,
                    'correct_in_top5': any(p['mapped'] == gt_iso for p in xlsr_predictions) if gt_iso else None
                }
                results['xlsr_detailed'].append({
                    'file': os.path.basename(audio_path),
                    'gt_iso': gt_iso or '',
                    'pred_iso': top1['mapped'],
                    'confidence': top1['confidence'],
                    'correct': gt_iso == top1['mapped'] if gt_iso else None
                })
            except Exception as e:
                print(f"  ✗ XLS-R error: {e}")
                file_analysis['xlsr'] = {'available': False, 'error': str(e)}
        results['comparison_data'].append(file_analysis)
        print("  ✓ Analysis complete\n")
    return results

# Run the independent analysis
if downloaded_files:
    print("Running independent model analysis...")
    # NOTE: this rebinds analysis_results, replacing the ensemble results from Cell 8
    analysis_results = analyze_downloaded_files_independently(downloaded_files)
else:
    print("✗ No files found for analysis")
    analysis_results = None
# ==============================================================================
# FIXED: Robust VoxLingua107 Analysis with Better Error Handling
# ==============================================================================
def parse_voxlingua_output_robust(out):
    """Robust parsing of VoxLingua107 output with multiple fallback methods"""
    try:
        # Method 1: standard SpeechBrain output format
        if isinstance(out, (tuple, list)) and len(out) >= 4:
            logits, log_conf, pred_idx, labels = out[:4]
            # Validate components
            if hasattr(logits, 'squeeze') and hasattr(labels, '__getitem__'):
                return logits, log_conf, pred_idx, labels, "standard"
        # Method 2: alternative format (sometimes returns a dict)
        if isinstance(out, dict):
            logits = out.get('predictions', out.get('logits'))
            labels = out.get('labels', out.get('text_lab'))
            log_conf = out.get('log_probabilities', out.get('log_conf'))
            pred_idx = out.get('predicted_ids', out.get('pred_idx'))
            if all(v is not None for v in [logits, labels]):
                return logits, log_conf, pred_idx, labels, "dict"
        # Method 3: direct tensor output
        if hasattr(out, 'squeeze'):  # direct logits tensor
            logits = out
            # Create dummy labels based on logits size
            labels = [f"lang_{i}" for i in range(logits.shape[-1])]
            log_conf = torch.log_softmax(logits, dim=-1).max()
            pred_idx = torch.argmax(logits, dim=-1)
            return logits, log_conf, pred_idx, labels, "tensor"
    except Exception as e:
        print(f"  Parse error: {e}")
    return None, None, None, None, "failed"

def analyze_voxlingua_robust(audio_path):
    """Robust VoxLingua107 analysis with multiple parsing methods"""
    if voxlingua_model is None:
        return None
    try:
        # Get raw output from model
        raw_out = voxlingua_model.classify_file(audio_path)
        # Parse with robust method
        logits, log_conf, pred_idx, labels, parse_method = parse_voxlingua_output_robust(raw_out)
        if logits is None:
            print("  ✗ Could not parse VoxLingua output format")
            return None
        print(f"  Parse method: {parse_method}")
        # Get predictions based on available data
        if hasattr(logits, 'squeeze'):
            probs = torch.softmax(logits.squeeze(), dim=-1 if len(logits.squeeze().shape) > 0 else 0)
            # Handle different tensor shapes
            if len(probs.shape) == 0:  # scalar
                top_indices = torch.tensor([0])
                top_probs = probs.unsqueeze(0)
            else:  # vector
                k = min(5, len(probs))
                top_probs, top_indices = torch.topk(probs, k)
        else:
            print("  ✗ Logits not in expected tensor format")
            return None
        predictions = []
        for rank, (idx, prob) in enumerate(zip(top_indices, top_probs), 1):
            idx_val = idx.item() if hasattr(idx, 'item') else int(idx)
            prob_val = prob.item() if hasattr(prob, 'item') else float(prob)
            # Get language label safely
            if idx_val < len(labels):
                lang_label = labels[idx_val]
            else:
                lang_label = f"unknown_{idx_val}"
            # Parse language code
            if isinstance(lang_label, str):
                colon_pos = lang_label.find(":")
                lang_code = lang_label[:colon_pos].strip() if colon_pos != -1 else lang_label.strip()
            else:
                lang_code = str(lang_label)
            # Map to dataset language
            mapped_lang = map_to_dataset_language(lang_code)
            predictions.append({
                'rank': rank,
                'original': lang_code,
                'mapped': mapped_lang,
                'confidence': prob_val,
                'in_dataset': mapped_lang in ALL_SUPPORTED_LANGS
            })
            status = "✓" if mapped_lang in ALL_SUPPORTED_LANGS else "✗"
            print(f"    #{rank}: {lang_code} -> {mapped_lang} ({prob_val:.4f}) {status}")
        return predictions
    except Exception as e:
        print(f"  ✗ VoxLingua analysis error: {e}")
        print(f"  ✗ Error type: {type(e).__name__}")
        return None

def analyze_xlsr_robust(audio_path):
    """Robust XLS-R analysis"""
    if xlsr_lid_model is None:
        return None
    try:
        raw_out = xlsr_lid_model.classify_file(audio_path)
        # Handle different XLS-R output formats
        if isinstance(raw_out, (tuple, list)) and len(raw_out) >= 4:
            out_prob, score, index, text_lab = raw_out[:4]
        else:
            print("  ✗ XLS-R output format not recognized")
            return None
        # Get top predictions
        if hasattr(out_prob, 'squeeze'):
            probs = torch.softmax(out_prob.squeeze(), dim=-1 if len(out_prob.squeeze().shape) > 0 else 0)
            if len(probs.shape) == 0:  # scalar
                top_indices = torch.tensor([0])
                top_probs = probs.unsqueeze(0)
            else:  # vector
                k = min(5, len(probs))
                top_probs, top_indices = torch.topk(probs, k)
        else:
            print("  ✗ XLS-R probabilities not in expected format")
            return None
        predictions = []
        for rank, (idx, prob) in enumerate(zip(top_indices, top_probs), 1):
            idx_val = idx.item() if hasattr(idx, 'item') else int(idx)
            prob_val = prob.item() if hasattr(prob, 'item') else float(prob)
            # Get language label
            if idx_val < len(text_lab):
                lang_label = text_lab[idx_val]
            else:
                lang_label = f"unknown_{idx_val}"
            lang_code = str(lang_label).strip().lower()
            mapped_lang = map_to_dataset_language(lang_code)
            predictions.append({
                'rank': rank,
                'original': lang_code,
                'mapped': mapped_lang,
                'confidence': prob_val,
                'in_dataset': mapped_lang in ALL_SUPPORTED_LANGS
            })
            status = "✓" if mapped_lang in ALL_SUPPORTED_LANGS else "✗"
            print(f"    #{rank}: {lang_code} -> {mapped_lang} ({prob_val:.4f}) {status}")
        return predictions
    except Exception as e:
        print(f"  ✗ XLS-R analysis error: {e}")
        return None

# ==============================================================================
# UPDATED: Robust Analysis Function
# ==============================================================================
def analyze_downloaded_files_robust(audio_files):
    """Robust analysis with better error handling"""
    if not audio_files:
        print("✗ No audio files to analyze")
        return None
    print(f"Starting ROBUST analysis on {len(audio_files)} files...")
    print("=" * 70)
    results = {
        'voxlingua_detailed': [],
        'xlsr_detailed': [],
        'comparison_data': []
    }
    for i, audio_path in enumerate(audio_files, 1):
        print(f"\n[{i}/{len(audio_files)}] {os.path.basename(audio_path)}")
        # Extract ground truth
        gt_iso = gt_from_filename(audio_path)
        print(f"  Ground Truth: {gt_iso or 'Unknown'}")
        file_analysis = {
            'file': os.path.basename(audio_path),
            'full_path': audio_path,
            'gt_iso': gt_iso or '',
            'voxlingua': {'available': False},
            'xlsr': {'available': False}
        }
        # VoxLingua107 analysis
        print("  VoxLingua107 Analysis:")
        vox_predictions = analyze_voxlingua_robust(audio_path)
        if vox_predictions:
            top1 = vox_predictions[0]
            file_analysis['voxlingua'] = {
                'available': True,
                'top5_predictions': vox_predictions,
                'top1_prediction': top1['mapped'],
                'top1_confidence': top1['confidence'],
                'correct_top1': gt_iso == top1['mapped'] if gt_iso else None,
                'correct_in_top5': any(p['mapped'] == gt_iso for p in vox_predictions) if gt_iso else None
            }
            results['voxlingua_detailed'].append({
                'file': os.path.basename(audio_path),
                'gt_iso': gt_iso or '',
                'pred_iso': top1['mapped'],
                'confidence': top1['confidence'],
                'correct': gt_iso == top1['mapped'] if gt_iso else None
            })
        else:
            file_analysis['voxlingua'] = {'available': False, 'error': 'Analysis failed'}
        # XLS-R analysis
        print("  XLS-R Analysis:")
        xlsr_predictions = analyze_xlsr_robust(audio_path)
        if xlsr_predictions:
            top1 = xlsr_predictions[0]
            file_analysis['xlsr'] = {
                'available': True,
                'top5_predictions': xlsr_predictions,
                'top1_prediction': top1['mapped'],
                'top1_confidence': top1['confidence'],
                'correct_top1': gt_iso == top1['mapped'] if gt_iso else None,
                'correct_in_top5': any(p['mapped'] == gt_iso for p in xlsr_predictions) if gt_iso else None
            }
            results['xlsr_detailed'].append({
                'file': os.path.basename(audio_path),
                'gt_iso': gt_iso or '',
                'pred_iso': top1['mapped'],
                'confidence': top1['confidence'],
                'correct': gt_iso == top1['mapped'] if gt_iso else None
            })
        else:
            file_analysis['xlsr'] = {'available': False, 'error': 'Analysis failed'}
        results['comparison_data'].append(file_analysis)
        print("  ✓ Analysis complete")
    return results

# Run the robust analysis
# NOTE: generate_detailed_performance_report is defined in the next cell;
# run that cell first or the report call below raises NameError.
if 'downloaded_files' in globals() and downloaded_files:
    print("Running ROBUST independent model analysis...")
    robust_analysis_results = analyze_downloaded_files_robust(downloaded_files)
    # Generate report
    if robust_analysis_results:
        generate_detailed_performance_report(robust_analysis_results)
        print("\n✓ ROBUST ANALYSIS COMPLETE!")
    else:
        print("✗ Robust analysis failed")
else:
    print("✗ No downloaded files found. Please run the file scanning code first.")
# ==============================================================================
# COMPLETE FIX: VoxLingua Label Mapping + Missing Function
# ==============================================================================
# First, a VoxLingua index-to-language mapping.
# CAUTION: this table is a hand-written approximation: it lists 108 indices
# (0-107) for a 107-class model, and at least one entry ('of' at index 100) is
# not a valid language code. The authoritative ordering lives in the model's
# label_encoder; see the sketch after get_voxlingua_language_by_index below.
VOXLINGUA_LANGUAGE_MAP = {
    0: 'ab', 1: 'af', 2: 'ak', 3: 'am', 4: 'ar', 5: 'as', 6: 'az', 7: 'be', 8: 'bg', 9: 'bn',
    10: 'bo', 11: 'br', 12: 'bs', 13: 'ca', 14: 'ce', 15: 'co', 16: 'cs', 17: 'cv', 18: 'cy', 19: 'da',
    20: 'de', 21: 'dv', 22: 'dz', 23: 'ee', 24: 'el', 25: 'en', 26: 'eo', 27: 'es', 28: 'et', 29: 'eu',
    30: 'fa', 31: 'ff', 32: 'fi', 33: 'fo', 34: 'fr', 35: 'fy', 36: 'ga', 37: 'gd', 38: 'gl', 39: 'gn',
    40: 'gu', 41: 'gv', 42: 'ha', 43: 'haw', 44: 'he', 45: 'hi', 46: 'hr', 47: 'ht', 48: 'hu', 49: 'hy',
    50: 'ia', 51: 'id', 52: 'ie', 53: 'ig', 54: 'ii', 55: 'ik', 56: 'io', 57: 'is', 58: 'it', 59: 'iu',
    60: 'ja', 61: 'jv', 62: 'ka', 63: 'kk', 64: 'kl', 65: 'km', 66: 'kn', 67: 'ko', 68: 'ks', 69: 'ku',
    70: 'kw', 71: 'ky', 72: 'la', 73: 'lb', 74: 'lg', 75: 'li', 76: 'ln', 77: 'lo', 78: 'lt', 79: 'lv',
    80: 'mg', 81: 'mi', 82: 'mk', 83: 'ml', 84: 'mn', 85: 'mr', 86: 'ms', 87: 'mt', 88: 'my', 89: 'na',
    90: 'nb', 91: 'nd', 92: 'ne', 93: 'ng', 94: 'nl', 95: 'nn', 96: 'no', 97: 'nv', 98: 'ny', 99: 'oc',
    100: 'of', 101: 'om', 102: 'or', 103: 'os', 104: 'pa', 105: 'pi', 106: 'pl', 107: 'ps'
}

def get_voxlingua_language_by_index(idx):
    """Map VoxLingua index to language code"""
    return VOXLINGUA_LANGUAGE_MAP.get(idx, f'unknown_{idx}')
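# --- Added sketch (not in the original cells): derive the index->language table
# from the checkpoint itself instead of the hand-written map above. Assumes the
# loaded model exposes hparams.label_encoder (the VoxLingua107 recipe does) and
# that labels may look like "hi: Hindi", so the part before any colon is kept.
def voxlingua_index_map_from_model(model):
    """Return {class_index: language_code} from the model's label encoder, or None."""
    try:
        ind2lab = model.hparams.label_encoder.ind2lab
        return {i: str(lab).split(":")[0].strip() for i, lab in ind2lab.items()}
    except AttributeError:
        return None

if voxlingua_model is not None:
    _learned_map = voxlingua_index_map_from_model(voxlingua_model)
    if _learned_map:
        VOXLINGUA_LANGUAGE_MAP.update(_learned_map)  # prefer checkpoint labels over the hand-written table
        print(f"Label map refreshed from checkpoint: {len(_learned_map)} classes")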
def analyze_voxlingua_fixed(audio_path):
    """Fixed VoxLingua107 analysis with proper language mapping"""
    if voxlingua_model is None:
        return None
    try:
        raw_out = voxlingua_model.classify_file(audio_path)
        if not isinstance(raw_out, (tuple, list)) or len(raw_out) < 4:
            print("  ✗ Unexpected VoxLingua output format")
            return None
        logits, log_conf, pred_idx, labels = raw_out[:4]
        # Get probabilities and top 5
        probs = torch.softmax(logits.squeeze(), dim=-1)
        k = min(5, len(probs))
        top_probs, top_indices = torch.topk(probs, k)
        predictions = []
        for rank, (idx, prob) in enumerate(zip(top_indices, top_probs), 1):
            idx_val = idx.item() if hasattr(idx, 'item') else int(idx)
            prob_val = prob.item() if hasattr(prob, 'item') else float(prob)
            # Method 1: try to use provided labels
            if idx_val < len(labels) and not str(labels[idx_val]).startswith('unknown'):
                lang_label = labels[idx_val]
                if isinstance(lang_label, str):
                    colon_pos = lang_label.find(":")
                    lang_code = lang_label[:colon_pos].strip() if colon_pos != -1 else lang_label.strip()
                else:
                    lang_code = str(lang_label)
            else:
                # Method 2: use our language mapping
                lang_code = get_voxlingua_language_by_index(idx_val)
            # Map to dataset language
            mapped_lang = map_to_dataset_language(lang_code)
            predictions.append({
                'rank': rank,
                'original': lang_code,
                'mapped': mapped_lang,
                'confidence': prob_val,
                'in_dataset': mapped_lang in ALL_SUPPORTED_LANGS,
                'index': idx_val
            })
            status = "✓" if mapped_lang in ALL_SUPPORTED_LANGS else "✗"
            print(f"    #{rank}: {lang_code} -> {mapped_lang} ({prob_val:.4f}) {status} [idx:{idx_val}]")
        return predictions
    except Exception as e:
        print(f"  ✗ VoxLingua analysis error: {e}")
        return None

def analyze_xlsr_fixed(audio_path):
    """Fixed XLS-R analysis"""
    if xlsr_lid_model is None:
        print("  ✗ XLS-R model not loaded")
        return None
    try:
        raw_out = xlsr_lid_model.classify_file(audio_path)
        if not isinstance(raw_out, (tuple, list)) or len(raw_out) < 4:
            print("  ✗ Unexpected XLS-R output format")
            return None
        out_prob, score, index, text_lab = raw_out[:4]
        # Get probabilities and top 5
        probs = torch.softmax(out_prob.squeeze(), dim=-1)
        k = min(5, len(probs))
        top_probs, top_indices = torch.topk(probs, k)
        predictions = []
        for rank, (idx, prob) in enumerate(zip(top_indices, top_probs), 1):
            idx_val = idx.item() if hasattr(idx, 'item') else int(idx)
            prob_val = prob.item() if hasattr(prob, 'item') else float(prob)
            # Get language label
            if idx_val < len(text_lab):
                lang_label = text_lab[idx_val]
                lang_code = str(lang_label).strip().lower()
            else:
                lang_code = f"xlsr_unknown_{idx_val}"
            mapped_lang = map_to_dataset_language(lang_code)
            predictions.append({
                'rank': rank,
                'original': lang_code,
                'mapped': mapped_lang,
                'confidence': prob_val,
                'in_dataset': mapped_lang in ALL_SUPPORTED_LANGS
            })
            status = "✓" if mapped_lang in ALL_SUPPORTED_LANGS else "✗"
            print(f"    #{rank}: {lang_code} -> {mapped_lang} ({prob_val:.4f}) {status}")
        return predictions
    except Exception as e:
        print(f"  ✗ XLS-R analysis error: {e}")
        return None
| def generate_detailed_performance_report(results): | |
| """Complete performance analysis report function""" | |
| if not results: | |
| print("β No results to analyze") | |
| return | |
| print("\nπ DETAILED INDEPENDENT MODEL PERFORMANCE REPORT") | |
| print("=" * 70) | |
| # VoxLingua107 Performance Analysis | |
| if results['voxlingua_detailed']: | |
| vox_df = pd.DataFrame(results['voxlingua_detailed']) | |
| valid_vox = vox_df[vox_df['gt_iso'] != ''].copy() | |
| print(f"\n㪠VOXLINGUA107 PERFORMANCE:") | |
| print("-" * 40) | |
| if len(valid_vox) > 0: | |
| vox_acc = (valid_vox['correct'] == True).mean() | |
| vox_conf_mean = valid_vox['confidence'].mean() | |
| vox_conf_std = valid_vox['confidence'].std() | |
| print(f"Files Analyzed: {len(valid_vox)}") | |
| print(f"Top-1 Accuracy: {vox_acc:.4f} ({vox_acc*100:.1f}%)") | |
| print(f"Confidence: {vox_conf_mean:.4f} Β± {vox_conf_std:.4f}") | |
| # Per-language breakdown | |
| print(f"\nPer-Language Performance:") | |
| for lang in sorted(valid_vox['gt_iso'].unique()): | |
| lang_data = valid_vox[valid_vox['gt_iso'] == lang] | |
| acc = (lang_data['correct'] == True).mean() | |
| conf_mean = lang_data['confidence'].mean() | |
| count = len(lang_data) | |
| print(f" {lang:>3}: {acc:.3f} ({acc*100:5.1f}%) | Conf: {conf_mean:.3f} | n={count}") | |
| else: | |
| print("No valid VoxLingua results") | |
| # XLS-R Performance Analysis | |
| if results['xlsr_detailed']: | |
| xlsr_df = pd.DataFrame(results['xlsr_detailed']) | |
| valid_xlsr = xlsr_df[xlsr_df['gt_iso'] != ''].copy() | |
| print(f"\n㪠XLS-R PERFORMANCE:") | |
| print("-" * 40) | |
| if len(valid_xlsr) > 0: | |
| xlsr_acc = (valid_xlsr['correct'] == True).mean() | |
| xlsr_conf_mean = valid_xlsr['confidence'].mean() | |
| xlsr_conf_std = valid_xlsr['confidence'].std() | |
| print(f"Files Analyzed: {len(valid_xlsr)}") | |
| print(f"Top-1 Accuracy: {xlsr_acc:.4f} ({xlsr_acc*100:.1f}%)") | |
| print(f"Confidence: {xlsr_conf_mean:.4f} Β± {xlsr_conf_std:.4f}") | |
| # Per-language breakdown | |
| print(f"\nPer-Language Performance:") | |
| for lang in sorted(valid_xlsr['gt_iso'].unique()): | |
| lang_data = valid_xlsr[valid_xlsr['gt_iso'] == lang] | |
| acc = (lang_data['correct'] == True).mean() | |
| conf_mean = lang_data['confidence'].mean() | |
| count = len(lang_data) | |
| print(f" {lang:>3}: {acc:.3f} ({acc*100:5.1f}%) | Conf: {conf_mean:.3f} | n={count}") | |
| else: | |
| print("No valid XLS-R results") | |
| # Model Comparison (guarded: vox_acc / xlsr_acc stay None when a model | |
| # produced no scorable results, which would otherwise raise a NameError) | |
| if vox_acc is not None and xlsr_acc is not None: | |
| print(f"\n⚖️ MODEL COMPARISON:") | |
| print("-" * 30) | |
| print(f"VoxLingua107: {vox_acc:.4f} accuracy") | |
| print(f"XLS-R: {xlsr_acc:.4f} accuracy") | |
| # Weight each model in proportion to its accuracy | |
| total_acc = vox_acc + xlsr_acc | |
| if total_acc > 0: | |
| vox_weight = vox_acc / total_acc | |
| xlsr_weight = xlsr_acc / total_acc | |
| print(f"\n💡 RECOMMENDED WEIGHTS:") | |
| print(f"VoxLingua107: {vox_weight:.3f} ({vox_weight*100:.1f}%)") | |
| print(f"XLS-R: {xlsr_weight:.3f} ({xlsr_weight*100:.1f}%)") | |
| # Label-set overlap plus true per-file agreement | |
| vox_preds = set(vox_df['pred_iso'].tolist()) | |
| xlsr_preds = set(xlsr_df['pred_iso'].tolist()) | |
| common_preds = vox_preds.intersection(xlsr_preds) | |
| merged = vox_df.merge(xlsr_df, on='file', suffixes=('_vox', '_xlsr')) | |
| agreement = (merged['pred_iso_vox'] == merged['pred_iso_xlsr']).mean() if len(merged) > 0 else 0.0 | |
| print(f"\nModel Agreement Analysis:") | |
| print(f"Per-file agreement: {agreement:.3f} ({agreement*100:.1f}%)") | |
| print(f"Labels predicted by both models: {len(common_preds)}") | |
| print(f"VoxLingua-only labels: {len(vox_preds - xlsr_preds)}") | |
| print(f"XLS-R-only labels: {len(xlsr_preds - vox_preds)}") | |
| # Save results | |
| timestamp = pd.Timestamp.now().strftime("%Y%m%d_%H%M%S") | |
| if results['voxlingua_detailed']: | |
| vox_csv = f"voxlingua_fixed_results_{timestamp}.csv" | |
| pd.DataFrame(results['voxlingua_detailed']).to_csv(vox_csv, index=False) | |
| print(f"\nπΎ VoxLingua results: {vox_csv}") | |
| if results['xlsr_detailed']: | |
| xlsr_csv = f"xlsr_fixed_results_{timestamp}.csv" | |
| pd.DataFrame(results['xlsr_detailed']).to_csv(xlsr_csv, index=False) | |
| print(f"πΎ XLS-R results: {xlsr_csv}") | |
| def run_complete_fixed_analysis(audio_files): | |
| """Run complete analysis with all fixes""" | |
| if not audio_files: | |
| print("β No audio files to analyze") | |
| return None | |
| print(f"π Starting COMPLETE FIXED analysis on {len(audio_files)} files...") | |
| print("=" * 70) | |
| results = { | |
| 'voxlingua_detailed': [], | |
| 'xlsr_detailed': [], | |
| 'comparison_data': [] | |
| } | |
| for i, audio_path in enumerate(audio_files, 1): | |
| print(f"\n[{i}/{len(audio_files)}] π΅ {os.path.basename(audio_path)}") | |
| # Extract ground truth | |
| gt_iso = gt_from_filename(audio_path) | |
| print(f" π Ground Truth: {gt_iso or 'Unknown'}") | |
| file_analysis = { | |
| 'file': os.path.basename(audio_path), | |
| 'full_path': audio_path, | |
| 'gt_iso': gt_iso or '', | |
| 'voxlingua': {'available': False}, | |
| 'xlsr': {'available': False} | |
| } | |
| # VoxLingua107 Analysis | |
| print(f" π¬ VoxLingua107 Analysis:") | |
| vox_predictions = analyze_voxlingua_fixed(audio_path) | |
| if vox_predictions and len(vox_predictions) > 0: | |
| top1 = vox_predictions[0] | |
| file_analysis['voxlingua'] = { | |
| 'available': True, | |
| 'top5_predictions': vox_predictions, | |
| 'top1_prediction': top1['mapped'], | |
| 'top1_confidence': top1['confidence'], | |
| 'correct_top1': gt_iso == top1['mapped'] if gt_iso else None, | |
| } | |
| results['voxlingua_detailed'].append({ | |
| 'file': os.path.basename(audio_path), | |
| 'gt_iso': gt_iso or '', | |
| 'pred_iso': top1['mapped'], | |
| 'confidence': top1['confidence'], | |
| 'correct': gt_iso == top1['mapped'] if gt_iso else None | |
| }) | |
| # XLS-R Analysis | |
| print(f" π¬ XLS-R Analysis:") | |
| xlsr_predictions = analyze_xlsr_fixed(audio_path) | |
| if xlsr_predictions and len(xlsr_predictions) > 0: | |
| top1 = xlsr_predictions[0] | |
| file_analysis['xlsr'] = { | |
| 'available': True, | |
| 'top5_predictions': xlsr_predictions, | |
| 'top1_prediction': top1['mapped'], | |
| 'top1_confidence': top1['confidence'], | |
| 'correct_top1': gt_iso == top1['mapped'] if gt_iso else None, | |
| } | |
| results['xlsr_detailed'].append({ | |
| 'file': os.path.basename(audio_path), | |
| 'gt_iso': gt_iso or '', | |
| 'pred_iso': top1['mapped'], | |
| 'confidence': top1['confidence'], | |
| 'correct': gt_iso == top1['mapped'] if gt_iso else None | |
| }) | |
| results['comparison_data'].append(file_analysis) | |
| print(f" β Analysis complete") | |
| return results | |
| # Run the complete fixed analysis | |
| if 'downloaded_files' in globals() and downloaded_files: | |
| print("π¬ Running COMPLETE FIXED analysis...") | |
| final_analysis_results = run_complete_fixed_analysis(downloaded_files) | |
| if final_analysis_results: | |
| generate_detailed_performance_report(final_analysis_results) | |
| print(f"\nβ COMPLETE FIXED ANALYSIS DONE!") | |
| else: | |
| print("β Analysis failed") | |
| else: | |
| print("β No downloaded files found") | |
| # ============================================================================== | |
| # COMPREHENSIVE EXCEL ANALYSIS WITH ALL DETAILS | |
| # ============================================================================== | |
| import pandas as pd | |
| import numpy as np | |
| from datetime import datetime | |
| import os | |
| def create_comprehensive_excel_analysis(results, output_filename=None): | |
| """Create comprehensive Excel analysis with multiple sheets and detailed metrics""" | |
| if not results: | |
| print("β No results to analyze") | |
| return None | |
| # Generate filename if not provided | |
| if not output_filename: | |
| timestamp = datetime.now().strftime("%Y%m%d_%H%M%S") | |
| output_filename = f"Language_Detection_Comprehensive_Analysis_{timestamp}.xlsx" | |
| print(f"π Creating comprehensive Excel analysis: {output_filename}") | |
| # Create Excel writer | |
| with pd.ExcelWriter(output_filename, engine='openpyxl') as writer: | |
| # ======================================== | |
| # SHEET 1: EXECUTIVE SUMMARY | |
| # ======================================== | |
| print(" π Creating Executive Summary...") | |
| summary_data = [] | |
| # Overall statistics | |
| total_files = len(results['comparison_data']) | |
| vox_available = sum(1 for item in results['comparison_data'] if item['voxlingua']['available']) | |
| xlsr_available = sum(1 for item in results['comparison_data'] if item['xlsr']['available']) | |
| summary_data.extend([ | |
| ['EXECUTIVE SUMMARY', ''], | |
| ['Analysis Date', datetime.now().strftime("%Y-%m-%d %H:%M:%S")], | |
| ['Total Files Analyzed', total_files], | |
| ['VoxLingua107 Available', f"{vox_available} ({vox_available/max(total_files, 1)*100:.1f}%)"], | |
| ['XLS-R Available', f"{xlsr_available} ({xlsr_available/max(total_files, 1)*100:.1f}%)"], | |
| ['', ''], | |
| ]) | |
| # Model performance summary | |
| if results['voxlingua_detailed']: | |
| vox_df = pd.DataFrame(results['voxlingua_detailed']) | |
| valid_vox = vox_df[vox_df['gt_iso'] != ''].copy() | |
| if len(valid_vox) > 0: | |
| vox_acc = (valid_vox['correct'] == True).mean() | |
| vox_conf = valid_vox['confidence'].mean() | |
| summary_data.extend([ | |
| ['VOXLINGUA107 PERFORMANCE', ''], | |
| ['Accuracy', f"{vox_acc:.4f} ({vox_acc*100:.1f}%)"], | |
| ['Average Confidence', f"{vox_conf:.4f}"], | |
| ['Files with Valid GT', len(valid_vox)], | |
| ['', ''], | |
| ]) | |
| if results['xlsr_detailed']: | |
| xlsr_df = pd.DataFrame(results['xlsr_detailed']) | |
| valid_xlsr = xlsr_df[xlsr_df['gt_iso'] != ''].copy() | |
| if len(valid_xlsr) > 0: | |
| xlsr_acc = (valid_xlsr['correct'] == True).mean() | |
| xlsr_conf = valid_xlsr['confidence'].mean() | |
| summary_data.extend([ | |
| ['XLS-R PERFORMANCE', ''], | |
| ['Accuracy', f"{xlsr_acc:.4f} ({xlsr_acc*100:.1f}%)"], | |
| ['Average Confidence', f"{xlsr_conf:.4f}"], | |
| ['Files with Valid GT', len(valid_xlsr)], | |
| ['', ''], | |
| ]) | |
| # Optimal weights calculation (needs accuracies from both models, so | |
| # guard on both result lists instead of VoxLingua alone) | |
| if results['voxlingua_detailed'] and results['xlsr_detailed'] and len(valid_vox) > 0 and len(valid_xlsr) > 0: | |
| total_acc = vox_acc + xlsr_acc | |
| if total_acc > 0: | |
| vox_weight = vox_acc / total_acc | |
| xlsr_weight = xlsr_acc / total_acc | |
| summary_data.extend([ | |
| ['RECOMMENDED ENSEMBLE WEIGHTS', ''], | |
| ['VoxLingua107 Weight', f"{vox_weight:.3f} ({vox_weight*100:.1f}%)"], | |
| ['XLS-R Weight', f"{xlsr_weight:.3f} ({xlsr_weight*100:.1f}%)"], | |
| ]) | |
| # Create summary dataframe | |
| summary_df = pd.DataFrame(summary_data, columns=['Metric', 'Value']) | |
| summary_df.to_excel(writer, sheet_name='Executive_Summary', index=False) | |
| # ======================================== | |
| # SHEET 2: VOXLINGUA107 DETAILED RESULTS | |
| # ======================================== | |
| # get_language_family is used by several later sheets too, so define it | |
| # before this conditional block rather than inside it | |
| def get_language_family(lang): | |
| if lang in INDO_ARYAN_LANGS: | |
| return 'Indo-Aryan' | |
| elif lang in DRAVIDIAN_LANGS: | |
| return 'Dravidian' | |
| elif lang in LOW_RESOURCE_LANGS: | |
| return 'Low-Resource' | |
| else: | |
| return 'Other' | |
| if results['voxlingua_detailed']: | |
| print(" 📊 Creating VoxLingua107 detailed results...") | |
| vox_detailed_df = pd.DataFrame(results['voxlingua_detailed']) | |
| # Add analysis columns ('correct' can be None when ground truth is | |
| # missing, so treat those rows as incorrect before casting to int) | |
| vox_detailed_df['accuracy_score'] = vox_detailed_df['correct'].fillna(False).astype(int) | |
| vox_detailed_df['confidence_category'] = pd.cut( | |
| vox_detailed_df['confidence'], | |
| bins=[0, 0.3, 0.6, 0.8, 1.0], | |
| labels=['Low', 'Medium', 'High', 'Very High'] | |
| ) | |
| # Add language family information | |
| vox_detailed_df['gt_language_family'] = vox_detailed_df['gt_iso'].apply(get_language_family) | |
| vox_detailed_df['pred_language_family'] = vox_detailed_df['pred_iso'].apply(get_language_family) | |
| vox_detailed_df.to_excel(writer, sheet_name='VoxLingua107_Results', index=False) | |
| # ======================================== | |
| # SHEET 3: XLS-R DETAILED RESULTS | |
| # ======================================== | |
| if results['xlsr_detailed']: | |
| print(" π Creating XLS-R detailed results...") | |
| xlsr_detailed_df = pd.DataFrame(results['xlsr_detailed']) | |
| # Add analysis columns | |
| xlsr_detailed_df['accuracy_score'] = xlsr_detailed_df['correct'].astype(int) | |
| xlsr_detailed_df['confidence_category'] = pd.cut( | |
| xlsr_detailed_df['confidence'], | |
| bins=[0, 0.3, 0.6, 0.8, 1.0], | |
| labels=['Low', 'Medium', 'High', 'Very High'] | |
| ) | |
| xlsr_detailed_df['gt_language_family'] = xlsr_detailed_df['gt_iso'].apply(get_language_family) | |
| xlsr_detailed_df['pred_language_family'] = xlsr_detailed_df['pred_iso'].apply(get_language_family) | |
| xlsr_detailed_df.to_excel(writer, sheet_name='XLSR_Results', index=False) | |
| # ======================================== | |
| # SHEET 4: PER-LANGUAGE ACCURACY ANALYSIS | |
| # ======================================== | |
| print(" π Creating per-language accuracy analysis...") | |
| lang_analysis_data = [] | |
| # Get all unique languages from ground truth | |
| all_gt_langs = set() | |
| if results['voxlingua_detailed']: | |
| all_gt_langs.update([r['gt_iso'] for r in results['voxlingua_detailed'] if r['gt_iso']]) | |
| if results['xlsr_detailed']: | |
| all_gt_langs.update([r['gt_iso'] for r in results['xlsr_detailed'] if r['gt_iso']]) | |
| # Language name mapping | |
| LANG_NAMES = { | |
| 'ur': 'Urdu', 'pa': 'Punjabi', 'ta': 'Tamil', 'sd': 'Sindhi', 'or': 'Odia', | |
| 'ml': 'Malayalam', 'ne': 'Nepali', 'as': 'Assamese', 'hi': 'Hindi', 'bn': 'Bengali', | |
| 'kok': 'Konkani', 'kn': 'Kannada', 'ks': 'Kashmiri', 'mr': 'Marathi', 'te': 'Telugu', | |
| 'br': 'Bodo', 'doi': 'Dogri', 'sat': 'Santali', 'gu': 'Gujarati', 'mni': 'Manipuri', | |
| 'sa': 'Sanskrit' | |
| } | |
| for lang in sorted(all_gt_langs): | |
| lang_name = LANG_NAMES.get(lang, lang.title()) | |
| lang_family = get_language_family(lang) | |
| # VoxLingua stats for this language | |
| vox_stats = {'files': 0, 'correct': 0, 'accuracy': 0, 'avg_confidence': 0} | |
| if results['voxlingua_detailed']: | |
| vox_lang_data = [r for r in results['voxlingua_detailed'] if r['gt_iso'] == lang] | |
| if vox_lang_data: | |
| vox_stats['files'] = len(vox_lang_data) | |
| vox_stats['correct'] = sum(1 for r in vox_lang_data if r['correct']) | |
| vox_stats['accuracy'] = vox_stats['correct'] / vox_stats['files'] | |
| vox_stats['avg_confidence'] = np.mean([r['confidence'] for r in vox_lang_data]) | |
| # XLS-R stats for this language | |
| xlsr_stats = {'files': 0, 'correct': 0, 'accuracy': 0, 'avg_confidence': 0} | |
| if results['xlsr_detailed']: | |
| xlsr_lang_data = [r for r in results['xlsr_detailed'] if r['gt_iso'] == lang] | |
| if xlsr_lang_data: | |
| xlsr_stats['files'] = len(xlsr_lang_data) | |
| xlsr_stats['correct'] = sum(1 for r in xlsr_lang_data if r['correct']) | |
| xlsr_stats['accuracy'] = xlsr_stats['correct'] / xlsr_stats['files'] | |
| xlsr_stats['avg_confidence'] = np.mean([r['confidence'] for r in xlsr_lang_data]) | |
| lang_analysis_data.append({ | |
| 'Language_Code': lang, | |
| 'Language_Name': lang_name, | |
| 'Language_Family': lang_family, | |
| 'VoxLingua_Files': vox_stats['files'], | |
| 'VoxLingua_Correct': vox_stats['correct'], | |
| 'VoxLingua_Accuracy': f"{vox_stats['accuracy']:.4f}", | |
| 'VoxLingua_Accuracy_Pct': f"{vox_stats['accuracy']*100:.1f}%", | |
| 'VoxLingua_Avg_Confidence': f"{vox_stats['avg_confidence']:.4f}", | |
| 'XLSR_Files': xlsr_stats['files'], | |
| 'XLSR_Correct': xlsr_stats['correct'], | |
| 'XLSR_Accuracy': f"{xlsr_stats['accuracy']:.4f}", | |
| 'XLSR_Accuracy_Pct': f"{xlsr_stats['accuracy']*100:.1f}%", | |
| 'XLSR_Avg_Confidence': f"{xlsr_stats['avg_confidence']:.4f}", | |
| 'Better_Model': 'VoxLingua' if vox_stats['accuracy'] > xlsr_stats['accuracy'] else 'XLS-R' if xlsr_stats['accuracy'] > vox_stats['accuracy'] else 'Tie' | |
| }) | |
| lang_analysis_df = pd.DataFrame(lang_analysis_data) | |
| lang_analysis_df.to_excel(writer, sheet_name='Per_Language_Analysis', index=False) | |
| # ======================================== | |
| # SHEET 5: CONFUSION MATRIX - VOXLINGUA | |
| # ======================================== | |
| if results['voxlingua_detailed']: | |
| print(" π Creating VoxLingua confusion matrix...") | |
| vox_df = pd.DataFrame(results['voxlingua_detailed']) | |
| valid_vox = vox_df[vox_df['gt_iso'] != ''].copy() | |
| if len(valid_vox) > 0: | |
| # Create confusion matrix | |
| confusion_data = [] | |
| for gt_lang in sorted(valid_vox['gt_iso'].unique()): | |
| gt_data = valid_vox[valid_vox['gt_iso'] == gt_lang] | |
| row_data = {'Ground_Truth': gt_lang} | |
| for pred_lang in sorted(valid_vox['pred_iso'].unique()): | |
| count = len(gt_data[gt_data['pred_iso'] == pred_lang]) | |
| row_data[f'Predicted_{pred_lang}'] = count | |
| confusion_data.append(row_data) | |
| confusion_df = pd.DataFrame(confusion_data).fillna(0) | |
| confusion_df.to_excel(writer, sheet_name='VoxLingua_Confusion_Matrix', index=False) | |
| # ======================================== | |
| # SHEET 6: CONFUSION MATRIX - XLS-R | |
| # ======================================== | |
| if results['xlsr_detailed']: | |
| print(" π Creating XLS-R confusion matrix...") | |
| xlsr_df = pd.DataFrame(results['xlsr_detailed']) | |
| valid_xlsr = xlsr_df[xlsr_df['gt_iso'] != ''].copy() | |
| if len(valid_xlsr) > 0: | |
| confusion_data = [] | |
| for gt_lang in sorted(valid_xlsr['gt_iso'].unique()): | |
| gt_data = valid_xlsr[valid_xlsr['gt_iso'] == gt_lang] | |
| row_data = {'Ground_Truth': gt_lang} | |
| for pred_lang in sorted(valid_xlsr['pred_iso'].unique()): | |
| count = len(gt_data[gt_data['pred_iso'] == pred_lang]) | |
| row_data[f'Predicted_{pred_lang}'] = count | |
| confusion_data.append(row_data) | |
| confusion_df = pd.DataFrame(confusion_data).fillna(0) | |
| confusion_df.to_excel(writer, sheet_name='XLSR_Confusion_Matrix', index=False) | |
| # ======================================== | |
| # SHEET 7: CONFIDENCE ANALYSIS | |
| # ======================================== | |
| print(" π Creating confidence analysis...") | |
| confidence_analysis = [] | |
| # VoxLingua confidence analysis | |
| if results['voxlingua_detailed']: | |
| vox_df = pd.DataFrame(results['voxlingua_detailed']) | |
| valid_vox = vox_df[vox_df['gt_iso'] != ''].copy() | |
| if len(valid_vox) > 0: | |
| # upper bound 1.01 keeps a confidence of exactly 1.0 in the top bucket | |
| # (the :.1f label below still renders it as 1.0) | |
| for conf_range in [(0, 0.3), (0.3, 0.6), (0.6, 0.8), (0.8, 1.01)]: | |
| range_data = valid_vox[ | |
| (valid_vox['confidence'] >= conf_range[0]) & | |
| (valid_vox['confidence'] < conf_range[1]) | |
| ] | |
| if len(range_data) > 0: | |
| accuracy = (range_data['correct'] == True).mean() | |
| confidence_analysis.append({ | |
| 'Model': 'VoxLingua107', | |
| 'Confidence_Range': f"{conf_range[0]:.1f}-{conf_range[1]:.1f}", | |
| 'Files': len(range_data), | |
| 'Accuracy': f"{accuracy:.4f}", | |
| 'Accuracy_Pct': f"{accuracy*100:.1f}%", | |
| 'Avg_Confidence': f"{range_data['confidence'].mean():.4f}" | |
| }) | |
| # XLS-R confidence analysis | |
| if results['xlsr_detailed']: | |
| xlsr_df = pd.DataFrame(results['xlsr_detailed']) | |
| valid_xlsr = xlsr_df[xlsr_df['gt_iso'] != ''].copy() | |
| if len(valid_xlsr) > 0: | |
| # same inclusive top bucket as the VoxLingua loop above | |
| for conf_range in [(0, 0.3), (0.3, 0.6), (0.6, 0.8), (0.8, 1.01)]: | |
| range_data = valid_xlsr[ | |
| (valid_xlsr['confidence'] >= conf_range[0]) & | |
| (valid_xlsr['confidence'] < conf_range[1]) | |
| ] | |
| if len(range_data) > 0: | |
| accuracy = (range_data['correct'] == True).mean() | |
| confidence_analysis.append({ | |
| 'Model': 'XLS-R', | |
| 'Confidence_Range': f"{conf_range[0]:.1f}-{conf_range[1]:.1f}", | |
| 'Files': len(range_data), | |
| 'Accuracy': f"{accuracy:.4f}", | |
| 'Accuracy_Pct': f"{accuracy*100:.1f}%", | |
| 'Avg_Confidence': f"{range_data['confidence'].mean():.4f}" | |
| }) | |
| confidence_df = pd.DataFrame(confidence_analysis) | |
| confidence_df.to_excel(writer, sheet_name='Confidence_Analysis', index=False) | |
| # ======================================== | |
| # SHEET 8: ERROR ANALYSIS | |
| # ======================================== | |
| print(" π Creating error analysis...") | |
| error_analysis = [] | |
| # VoxLingua errors | |
| if results['voxlingua_detailed']: | |
| vox_df = pd.DataFrame(results['voxlingua_detailed']) | |
| vox_errors = vox_df[vox_df['correct'] == False].copy() | |
| for _, error in vox_errors.iterrows(): | |
| error_analysis.append({ | |
| 'Model': 'VoxLingua107', | |
| 'File': error['file'], | |
| 'Ground_Truth': error['gt_iso'], | |
| 'Predicted': error['pred_iso'], | |
| 'Confidence': f"{error['confidence']:.4f}", | |
| 'GT_Language_Family': get_language_family(error['gt_iso']), | |
| 'Pred_Language_Family': get_language_family(error['pred_iso']), | |
| 'Cross_Family_Error': get_language_family(error['gt_iso']) != get_language_family(error['pred_iso']) | |
| }) | |
| # XLS-R errors | |
| if results['xlsr_detailed']: | |
| xlsr_df = pd.DataFrame(results['xlsr_detailed']) | |
| xlsr_errors = xlsr_df[xlsr_df['correct'] == False].copy() | |
| for _, error in xlsr_errors.iterrows(): | |
| error_analysis.append({ | |
| 'Model': 'XLS-R', | |
| 'File': error['file'], | |
| 'Ground_Truth': error['gt_iso'], | |
| 'Predicted': error['pred_iso'], | |
| 'Confidence': f"{error['confidence']:.4f}", | |
| 'GT_Language_Family': get_language_family(error['gt_iso']), | |
| 'Pred_Language_Family': get_language_family(error['pred_iso']), | |
| 'Cross_Family_Error': get_language_family(error['gt_iso']) != get_language_family(error['pred_iso']) | |
| }) | |
| error_df = pd.DataFrame(error_analysis) | |
| error_df.to_excel(writer, sheet_name='Error_Analysis', index=False) | |
| # ======================================== | |
| # SHEET 9: LANGUAGE FAMILY PERFORMANCE | |
| # ======================================== | |
| print(" π Creating language family performance...") | |
| family_performance = [] | |
| families = ['Indo-Aryan', 'Dravidian', 'Low-Resource', 'Other'] | |
| for family in families: | |
| # VoxLingua performance for this family | |
| if results['voxlingua_detailed']: | |
| vox_df = pd.DataFrame(results['voxlingua_detailed']) | |
| vox_df = vox_df[vox_df['gt_iso'] != ''] # rows without ground truth would otherwise land in 'Other' | |
| family_data = vox_df[vox_df['gt_iso'].apply(lambda x: get_language_family(x) == family)] | |
| if len(family_data) > 0: | |
| vox_acc = (family_data['correct'] == True).mean() | |
| vox_conf = family_data['confidence'].mean() | |
| vox_files = len(family_data) | |
| else: | |
| vox_acc = vox_conf = vox_files = 0 | |
| else: | |
| vox_acc = vox_conf = vox_files = 0 | |
| # XLS-R performance for this family | |
| if results['xlsr_detailed']: | |
| xlsr_df = pd.DataFrame(results['xlsr_detailed']) | |
| xlsr_df = xlsr_df[xlsr_df['gt_iso'] != ''] # same ground-truth filter as above | |
| family_data = xlsr_df[xlsr_df['gt_iso'].apply(lambda x: get_language_family(x) == family)] | |
| if len(family_data) > 0: | |
| xlsr_acc = (family_data['correct'] == True).mean() | |
| xlsr_conf = family_data['confidence'].mean() | |
| xlsr_files = len(family_data) | |
| else: | |
| xlsr_acc = xlsr_conf = xlsr_files = 0 | |
| else: | |
| xlsr_acc = xlsr_conf = xlsr_files = 0 | |
| family_performance.append({ | |
| 'Language_Family': family, | |
| 'VoxLingua_Files': vox_files, | |
| 'VoxLingua_Accuracy': f"{vox_acc:.4f}", | |
| 'VoxLingua_Accuracy_Pct': f"{vox_acc*100:.1f}%", | |
| 'VoxLingua_Avg_Confidence': f"{vox_conf:.4f}", | |
| 'XLSR_Files': xlsr_files, | |
| 'XLSR_Accuracy': f"{xlsr_acc:.4f}", | |
| 'XLSR_Accuracy_Pct': f"{xlsr_acc*100:.1f}%", | |
| 'XLSR_Avg_Confidence': f"{xlsr_conf:.4f}", | |
| 'Better_Model': 'VoxLingua' if vox_acc > xlsr_acc else 'XLS-R' if xlsr_acc > vox_acc else 'Tie' | |
| }) | |
| family_df = pd.DataFrame(family_performance) | |
| family_df.to_excel(writer, sheet_name='Language_Family_Performance', index=False) | |
| # ======================================== | |
| # SHEET 10: TOP-5 PREDICTIONS (SAMPLE) | |
| # ======================================== | |
| print(" π Creating Top-5 predictions sample...") | |
| top5_sample = [] | |
| # Sample top-5 predictions from comparison data | |
| sample_files = results['comparison_data'][:20] # First 20 files as sample | |
| for file_data in sample_files: | |
| file_name = file_data['file'] | |
| gt_lang = file_data['gt_iso'] | |
| # VoxLingua Top-5 | |
| if file_data['voxlingua']['available'] and 'top5_predictions' in file_data['voxlingua']: | |
| for pred in file_data['voxlingua']['top5_predictions']: | |
| top5_sample.append({ | |
| 'Model': 'VoxLingua107', | |
| 'File': file_name, | |
| 'Ground_Truth': gt_lang, | |
| 'Rank': pred['rank'], | |
| 'Predicted_Language': pred['mapped'], | |
| 'Original_Output': pred['original'], | |
| 'Confidence': f"{pred['confidence']:.4f}", | |
| 'In_Dataset': pred['in_dataset'], | |
| 'Correct': gt_lang == pred['mapped'] | |
| }) | |
| # XLS-R Top-5 | |
| if file_data['xlsr']['available'] and 'top5_predictions' in file_data['xlsr']: | |
| for pred in file_data['xlsr']['top5_predictions']: | |
| top5_sample.append({ | |
| 'Model': 'XLS-R', | |
| 'File': file_name, | |
| 'Ground_Truth': gt_lang, | |
| 'Rank': pred['rank'], | |
| 'Predicted_Language': pred['mapped'], | |
| 'Original_Output': pred['original'], | |
| 'Confidence': f"{pred['confidence']:.4f}", | |
| 'In_Dataset': pred['in_dataset'], | |
| 'Correct': gt_lang == pred['mapped'] | |
| }) | |
| top5_df = pd.DataFrame(top5_sample) | |
| top5_df.to_excel(writer, sheet_name='Top5_Predictions_Sample', index=False) | |
| print(f"β Comprehensive Excel analysis created: {output_filename}") | |
| # Try to download the file | |
| try: | |
| from google.colab import files | |
| print(f"π₯ File downloaded successfully!") | |
| except: | |
| print(f"π File saved locally: {output_filename}") | |
| return output_filename | |
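| # ------------------------------------------------------------------ | |
| # Optional cosmetic pass (a sketch, not part of the pipeline): widen | |
| # each column of the generated workbook to fit its longest cell value, | |
| # using openpyxl directly. Call it with the filename returned above. | |
| # ------------------------------------------------------------------ | |
| def autofit_excel_columns(xlsx_path, max_width=60): | |
| from openpyxl import load_workbook | |
| from openpyxl.utils import get_column_letter | |
| wb = load_workbook(xlsx_path) | |
| for ws in wb.worksheets: | |
| for col_idx, column_cells in enumerate(ws.columns, 1): | |
| longest = max((len(str(c.value)) for c in column_cells if c.value is not None), default=0) | |
| ws.column_dimensions[get_column_letter(col_idx)].width = min(longest + 2, max_width) | |
| wb.save(xlsx_path) | |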
| # Run the comprehensive Excel analysis | |
| if 'final_analysis_results' in globals() and final_analysis_results: | |
| excel_filename = create_comprehensive_excel_analysis( | |
| final_analysis_results, | |
| "Language_Detection_Comprehensive_Analysis.xlsx" | |
| ) | |
| print(f"\nπ COMPREHENSIVE EXCEL ANALYSIS COMPLETE!") | |
| print(f"π File: {excel_filename}") | |
| # Print summary of what was created | |
| print(f"\nπ Excel Contains 10 Sheets:") | |
| print(f" 1. Executive_Summary - Key metrics and recommendations") | |
| print(f" 2. VoxLingua107_Results - Detailed VoxLingua results") | |
| print(f" 3. XLSR_Results - Detailed XLS-R results") | |
| print(f" 4. Per_Language_Analysis - Accuracy by language") | |
| print(f" 5. VoxLingua_Confusion_Matrix - VoxLingua confusion matrix") | |
| print(f" 6. XLSR_Confusion_Matrix - XLS-R confusion matrix") | |
| print(f" 7. Confidence_Analysis - Performance by confidence ranges") | |
| print(f" 8. Error_Analysis - Detailed error breakdown") | |
| print(f" 9. Language_Family_Performance - Performance by language family") | |
| print(f" 10. Top5_Predictions_Sample - Sample of top-5 predictions") | |
| else: | |
| print("β No analysis results found. Please run the analysis first.") | |