Zum Inhalt springen

MediaWiki:Gadget-LabelScan.js: Unterschied zwischen den Versionen

Aus ADOS Wiki
Keine Bearbeitungszusammenfassung
Keine Bearbeitungszusammenfassung
Zeile 1: Zeile 1:
/* global mw, Tesseract */
/* global mw */
(function () {
(function () {
   'use strict';
   'use strict';


   // ========================================================================
   // ---------- Hilfsfunktionen für UI ----------
  //  KONFIG
   function $(id){ return document.getElementById(id); }
  // ========================================================================
   function status(t){ const el=$('ados-scan-status'); if(el) el.textContent = t || ''; }
  // In welchen Kategorien wird gesucht?
  function progress(v){
  const ADOS_CATEGORIES = [
    const bar=$('ados-scan-progress');
    'Alle A Dream of Scotland Abfüllungen',
    if(!bar) return;
    'Alle A Dream of Ireland Abfüllungen',
    if(v == null){ bar.hidden = true; bar.value = 0; }
    'Alle A Dream of... – Der Rest der Welt Abfüllungen',
    else { bar.hidden = false; bar.value = Math.max(0, Math.min(1, v)); }
    'Friendly Mr. Z Whiskytainment Abfüllungen',
    'Die Whisky Elfen Abfüllungen',
    'The Fine Art of Whisky Abfüllungen',
    'Alle Rumbastic Abfüllungen'
  ];
 
  // Häufige Distillery-/Serien-Tokens (zum „Einhaken“ in die Suche)
  const KNOWN_TOKENS = [
    'Ardbeg','Ardmore','Arran','Auchroisk','Ben Nevis','Blair Athol','Bowmore',
    'Caol Ila','Clynelish','Glenallachie','Glenrothes','Longmorn','Lagavulin',
    'Tullibardine','Dalmore','Benrinnes','Mortlach','Glenlivet','Inchgower',
    'Islay','Speyside','Highland','Lowland','Campbeltown','Ireland',
    'A Dream of Scotland','A Dream of Ireland','The Fine Art of Whisky',
    'The Tasteful 8','Friendly Mr. Z','Die Whisky Elfen','Rumbastic'
  ];
 
  // Debug: Roh-OCR unten anzeigen, wenn true
  window.ADOS_SCAN_DEBUG = window.ADOS_SCAN_DEBUG || false;
 
  // ========================================================================
  //  DOM-Helfer
  // ========================================================================
   function byId(id){ return document.getElementById(id); }
   function hasUI(){
    return !!byId('ados-scan-run') && !!byId('ados-scan-file');
   }
   }
   function setStatus(t){ const el = byId('ados-scan-status'); if (el) el.textContent = t || ''; }
   function preview(file){
  function setProgress(p){
     const p = $('ados-scan-preview');
     const bar = byId('ados-scan-progress'); if (!bar) return;
     if(!p) return;
     if (p == null){ bar.hidden = true; bar.value = 0; }
    else { bar.hidden = false; bar.value = Math.max(0, Math.min(1, p)); }
  }
  function showPreview(file){
     const url = URL.createObjectURL(file);
     const url = URL.createObjectURL(file);
     const prev = byId('ados-scan-preview');
     p.innerHTML = '<img alt="Vorschau" style="max-width:100%;height:auto;border-radius:8px" />';
    if (prev){ prev.innerHTML = '<img alt="Vorschau" src="'+url+'">'; prev.setAttribute('aria-hidden','false'); }
    p.querySelector('img').src = url;
   }
   }


   // ========================================================================
   // ---------- Tesseract sauber laden (Worker/WASM/CDN) ----------
  //  TESSERACT sauber als WORKER laden (deu+eng)
   let _tessReady = null;
  // ========================================================================
   const TESS_CDN = 'https://cdn.jsdelivr.net/npm/tesseract.js@5/dist/';
   let _ocrWorkerPromise = null;
  async function ensureTesseract(){
   function getOcrWorker(){
    if(_tessReady) return _tessReady;
    if (_ocrWorkerPromise) return _ocrWorkerPromise;
    _tessReady = new Promise((resolve, reject) => {
    _ocrWorkerPromise = (async () => {
      if(window.Tesseract) return resolve();
      if (!window.Tesseract){
        await new Promise((res, rej) => {
          const s=document.createElement('script');
          s.src='https://cdn.jsdelivr.net/npm/tesseract.js@5/dist/tesseract.min.js';
          s.async=true; s.onload=res; s.onerror=() => {
            const s2=document.createElement('script');
            s2.src='https://unpkg.com/tesseract.js@5/dist/tesseract.min.js';
            s2.async=true; s2.onload=res; s2.onerror=rej; document.head.appendChild(s2);
          };
          document.head.appendChild(s);
        });
      }
      const { createWorker } = Tesseract;
      const worker = await createWorker({
        workerPath: 'https://cdn.jsdelivr.net/npm/tesseract.js@5/dist/worker.min.js',
        corePath:  'https://cdn.jsdelivr.net/npm/tesseract.js-core@5/tesseract-core.wasm.js',
        langPath:  'https://tessdata.projectnaptha.com/5',
        logger: m => {
          if (m && m.status === 'recognizing text' && typeof m.progress === 'number'){
            setProgress(0.05 + m.progress * 0.9);
          }
        }
      });
      await worker.loadLanguage('deu+eng');
      await worker.initialize('deu+eng');
      await worker.setParameters({ tessedit_pageseg_mode: '11', user_defined_dpi: '300' });
      return worker;
    })();
    return _ocrWorkerPromise;
  }


  // ========================================================================
      const s = document.createElement('script');
  //  Bild-Vorverarbeitung: Skalierung + adaptives Thresholding
      s.src = TESS_CDN + 'tesseract.min.js';
  // ========================================================================
      s.async = true;
  function scaleToCanvas(img, maxSide = 2000){
       s.onload = () => resolve();
    const s = Math.min(1, maxSide / Math.max(img.width, img.height));
       s.onerror = () => reject(new Error('Tesseract.js konnte nicht geladen werden'));
    const w = Math.round(img.width * s), h = Math.round(img.height * s);
       document.head.appendChild(s);
    const c = document.createElement('canvas'); c.width=w; c.height=h;
     });
    const ctx=c.getContext('2d'); ctx.imageSmoothingEnabled = true;
     return _tessReady;
    ctx.drawImage(img,0,0,w,h);
    return c;
  }
 
  function adaptiveThreshold(src){
    const w=src.width, h=src.height;
    const out=document.createElement('canvas'); out.width=w; out.height=h;
    const sctx=src.getContext('2d'), octx=out.getContext('2d');
    const id=sctx.getImageData(0,0,w,h), d=id.data;
    const gray=new Uint8ClampedArray(w*h);
    for(let i=0,j=0;i<d.length;i+=4,++j){
       gray[j]=(0.2126*d[i]+0.7152*d[i+1]+0.0722*d[i+2])|0;
    }
    const S=new Uint32Array((w+1)*(h+1));
    for(let y=1;y<=h;y++){
      let row=0;
      for(let x=1;x<=w;x++){
        const v=gray[(y-1)*w + (x-1)];
        row+=v; S[y*(w+1)+x]=S[(y-1)*(w+1)+x]+row;
       }
    }
    const win=Math.max(15, Math.round(Math.min(w,h)/24));
    const outId=octx.createImageData(w,h), od=outId.data;
    const C=7;
    for(let y=0;y<h;y++){
      const y0=Math.max(0,y-win), y1=Math.min(h-1,y+win);
       for(let x=0;x<w;x++){
        const x0=Math.max(0,x-win), x1=Math.min(w-1,x+win);
        const A=S[y0*(w+1)+x0], B=S[(y1+1)*(w+1)+x0], Cc=S[y0*(w+1)+(x1+1)], Dd=S[(y1+1)*(w+1)+(x1+1)];
        const area=(x1-x0+1)*(y1-y0+1);
        const mean=(Dd + A - B - Cc)/area;
        const g=gray[y*w+x];
        const pix = g < (mean - C) ? 0 : 255;
        const k=(y*w+x)*4; od[k]=od[k+1]=od[k+2]=pix; od[k+3]=255;
      }
     }
    octx.putImageData(outId,0,0);
     return out;
   }
   }


   // ========================================================================
   // Kleines Canvas-Preprocessing (Grayscale & leichter Kontrast)
  //  OCR: mehrere Strategien (PSM 11 → 6 → 4, binarisiert & farbig)
   async function preprocess(file){
  // ========================================================================
   async function runOCR(file){
    setProgress(0.02);
     const img = await new Promise((res, rej) => {
     const img = await new Promise((res, rej) => {
       const o=new Image(); o.onload=()=>res(o); o.onerror=rej;
       const i = new Image();
       o.src=URL.createObjectURL(file);
      i.onload = () => res(i);
      i.onerror = rej;
       i.src = URL.createObjectURL(file);
     });
     });
    const MAX = 1800;
    const scale = (img.width > img.height) ? (MAX / img.width) : (MAX / img.height);
    const w = Math.round(img.width * scale);
    const h = Math.round(img.height * scale);
    const c = document.createElement('canvas');
    c.width = w; c.height = h;
    const ctx = c.getContext('2d');
    ctx.imageSmoothingEnabled = true;
    ctx.drawImage(img, 0, 0, w, h);


     const base = scaleToCanvas(img, 2000);
     const id = ctx.getImageData(0,0,w,h), d=id.data;
    const bin  = adaptiveThreshold(base);
     for(let i=0;i<d.length;i+=4){
 
       const g = 0.2126*d[i] + 0.7152*d[i+1] + 0.0722*d[i+2];
    const worker = await getOcrWorker();
       const v = Math.max(0, Math.min(255, (g-128)*1.12 + 128)); // leichte Kontrastanhebung
    const candidates = [
       d[i]=d[i+1]=d[i+2]=v;
      { canvas: bin, psm: '11' },
      { canvas: base, psm: '11' },
      { canvas: bin,  psm: '6'  },
      { canvas: base, psm: '6'  },
      { canvas: bin, psm: '4'  },
      { canvas: base, psm: '4'  }
    ];
 
    let best = '';
     for (let i=0;i<candidates.length;i++){
       const c = candidates[i];
      await worker.setParameters({ tessedit_pageseg_mode: c.psm });
       const { data } = await worker.recognize(c.canvas);
      const txt = (data && data.text ? data.text : '').trim();
      if (txt.length > best.length) best = txt;
      if (best.length > 40) break;
       setProgress(0.96 + i * 0.008);
     }
     }
     setProgress(null);
     ctx.putImageData(id,0,0);
 
     return c;
    if (window.ADOS_SCAN_DEBUG){
      const box = byId('ados-scan-ocr');
      if (box) box.textContent = best || '(leer)';
    }
     return best;
   }
   }


   // ========================================================================
   // ---------- OCR ----------
  //  Hinweise aus OCR destillieren
   async function runOCR(file){
  // ========================================================================
    await ensureTesseract();
   function extractHints(text){
     const { createWorker } = window.Tesseract;
     const raw = String(text||'').replace(/\s+/g,' ').trim();


     const names = [];
    // Pfade hart setzen, damit Worker/WASM sicher gefunden werden
    KNOWN_TOKENS.forEach(t=>{
     const worker = await createWorker({
       const re = new RegExp('\\b'+t.replace(/[.*+?^${}()|[\]\\]/g,'\\$&')+'\\b','i');
       workerPath: TESS_CDN + 'worker.min.js',
      if (re.test(raw)) names.push(t);
      langPath:  TESS_CDN + 'langs/',
      corePath:  TESS_CDN + 'tesseract-core.wasm.js',
      logger: m => {
        if(m && typeof m.progress === 'number'){
          progress(m.progress);
        }
        if(m && m.status) {
          // optionales Debug
          // console.log('[OCR]', m.status, m.progress ?? '');
        }
      }
     });
     });


     const ageRe = /\b([1-9]\d?)\s?(?:years?|yo|jahr(?:e)?)\b/gi;
     try {
    const ages=[]; let m; while((m=ageRe.exec(raw))!==null){ if(!ages.includes(m[1])) ages.push(m[1]); }
      await worker.loadLanguage('eng+deu');
      await worker.initialize('eng+deu');


    const yearRe = /\b(19|20)\d{2}\b/g;
      const canvas = await preprocess(file);
    const years=[]; while((m=yearRe.exec(raw))!==null){ if(!years.includes(m[0])) years.push(m[0]); }


    const wordRe = /\b[A-ZÄÖÜ][A-Za-zÄÖÜäöüß\-]{3,}\b/g;
      // psm 6 = Block Text; oem 1 = LSTM
    const uniq=new Set(); const words=[]; let w;
      await worker.setParameters({
    while((w=wordRe.exec(raw))!==null){ const s=w[0]; if(!uniq.has(s)){ uniq.add(s); words.push(s); if(words.length>=8) break; } }
        tessedit_pageseg_mode: '6',
        preserve_interword_spaces: '1'
      });


     return { names, ages, years, words, raw };
      const result = await worker.recognize(canvas);
      const text = (result && result.data && result.data.text) ? result.data.text : '';
      return text.trim();
     } finally {
      await worker.terminate();
      progress(null);
    }
   }
   }


   // ========================================================================
   // ---------- einfache Treffer-Suche im Wiki ----------
  //  Suche im Wiki (3 Pässe)
   async function searchTitles(q){
  // ========================================================================
   async function searchWikiSmart(hints, limit){
     await mw.loader.using('mediawiki.api');
     await mw.loader.using('mediawiki.api');
     const api = new mw.Api();
     const api = new mw.Api();
    const MAX = limit || 12, ns0=0;


     function incats(){
     // sehr einfache Heuristik: nimm 3–5 „gute“ Wörter aus dem OCR
       return ADOS_CATEGORIES.map(c => 'incategory:"'+c+'"').join(' ');
    const words = String(q || '')
    }
       .replace(/[^\p{L}\p{N}\s\-']/gu,' ')
      .replace(/\s+/g,' ')
      .trim()
      .split(' ')
      .filter(w => w.length >= 3)
      .slice(0, 6);


    const pass1=[];
     if(!words.length) return [];
     if (hints.names.length){
      hints.names.forEach(n=>{
        if (hints.ages.length) hints.ages.forEach(a=> pass1.push(`intitle:"${n}" intitle:${a} ${incats()}`));
        if (hints.years.length) hints.years.forEach(y=> pass1.push(`intitle:"${n}" "${y}" ${incats()}`));
        pass1.push(`intitle:"${n}" ${incats()}`);
      });
    }


     const key=[].concat(hints.names.slice(0,2), hints.ages.slice(0,1), hints.years.slice(0,1), hints.words.slice(0,3))
     const sr = await api.get({
                .map(x=>`"${x}"`).join(' ');
      action: 'query',
     const pass2 = key ? [ `${key} ${incats()}` ] : [];
      list: 'search',
      srsearch: words.map(w => `"${w}"`).join(' '), // UND-verkettet
      srlimit: 12,
      srnamespace: 0,
      formatversion: 2
     });


     const pass3=[];
     return (sr.query && sr.query.search) ? sr.query.search : [];
    if (hints.names.length) pass3.push(hints.names[0]);
    if (!pass3.length && hints.words.length) pass3.push(hints.words[0]);
 
    const seen=new Set(), out=[];
 
    async function runSr(q){
      const r = await api.get({ action:'query', list:'search', srsearch:q, srnamespace:ns0, srlimit:MAX, formatversion:2 });
      (r.query?.search || []).forEach(it=>{
        const k=it.title; if (seen.has(k)) return; seen.add(k); out.push(it);
      });
    }
 
    for (const q of pass1){ await runSr(q); if (out.length>=MAX) return out.slice(0,MAX); }
    for (const q of pass2){ await runSr(q); if (out.length>=MAX) return out.slice(0,MAX); }
 
    for (const p of pass3){
      const r = await api.get({ action:'query', list:'prefixsearch', pssearch:p, psnamespace:ns0, pslimit:MAX });
      (r.query?.prefixsearch || []).forEach(it=>{
        const title = it.title || it['*']; const k=title;
        if (seen.has(k)) return; seen.add(k); out.push({ title, snippet:'' });
      });
      if (out.length>=MAX) break;
    }
 
    return out.slice(0,MAX);
   }
   }


  // ========================================================================
  //  Treffer rendern
  // ========================================================================
  function esc(s){ return mw.html.escape(String(s||'')); }
   function renderResults(items){
   function renderResults(items){
     const box = byId('ados-scan-results'); if (!box) return;
     const box = $('ados-scan-results');
     box.innerHTML='';
    if(!box) return;
     if (!items || !items.length){
     box.innerHTML = '';
       box.innerHTML='<div class="ados-hit">Keine klaren Treffer. Bitte anderes Foto oder manuell suchen.</div>';
     if(!items || !items.length){
       box.innerHTML = '<div class="ados-hit">Keine klaren Treffer. Bitte anderes Foto oder manuell suchen.</div>';
       return;
       return;
     }
     }
     items.slice(0,12).forEach(it=>{
     items.forEach(it => {
       const title = it.title || '';
       const title = it.title || '';
       const link  = mw.util.getUrl(title.replace(/ /g,'_'));
       const link  = mw.util.getUrl(title.replace(/ /g,'_'));
       const snip  = String(it.snippet||'').replace(/<\/?span[^>]*>/g,'').replace(/&quot;/g,'"');
       const snip  = String(it.snippet || '').replace(/<\/?span[^>]*>/g,'').replace(/&quot;/g,'"');
       const div=document.createElement('div'); div.className='ados-hit';
       const div = document.createElement('div');
       div.innerHTML = '<b><a href="'+link+'">'+esc(title)+'</a></b>' + (snip?'<div class="meta">'+snip+'</div>':'');
      div.className = 'ados-hit';
       div.innerHTML = '<b><a href="'+link+'">'+mw.html.escape(title)+'</a></b>' + (snip ? '<div class="meta">'+snip+'</div>' : '');
       box.appendChild(div);
       box.appendChild(div);
     });
     });
   }
   }


   // ========================================================================
   // ---------- Bindings ----------
  //  BINDING
  // ========================================================================
  let BOUND=false;
   function bind(){
   function bind(){
    if (BOUND || !hasUI()) return;
     const run = $('ados-scan-run');
     const runBtn = byId('ados-scan-run');
     const file= $('ados-scan-file');
     const fileIn = byId('ados-scan-file');
     const big = $('ados-scan-bigbtn');
     const bigBtn = byId('ados-scan-bigbtn');
 
     const drop  = byId('ados-scan-drop');
     if(!run || !file) return;


     if (!runBtn || !fileIn) return;
     if(big){ big.addEventListener('click', () => file.click()); }
     if (runBtn.dataset.bound === '1') return;
     file.addEventListener('change', () => { if(file.files && file.files[0]) preview(file.files[0]); });
    runBtn.dataset.bound='1'; BOUND=true;
 
    run.addEventListener('click', async (ev) => {
      ev.preventDefault();
      if(!(file.files && file.files[0])){
        alert('Bitte zuerst ein Foto auswählen oder aufnehmen.');
        return;
      }


    if (bigBtn) bigBtn.addEventListener('click', () => fileIn.click());
      const f = file.files[0];
    fileIn.addEventListener('change', function(){ if (this.files && this.files[0]) showPreview(this.files[0]); });
      run.disabled = true;
      const old = run.textContent;
      run.textContent = 'Erkenne …';
      status('Erkenne Label …');
      progress(0);


    // Drag&Drop
      try {
    if (drop){
        // 1) OCR
      ['dragenter','dragover'].forEach(ev=> drop.addEventListener(ev, e=>{ e.preventDefault(); drop.classList.add('is-drag'); }));
        const text = await runOCR(f);
      ['dragleave','drop'].forEach(ev=> drop.addEventListener(ev, e=>{ e.preventDefault(); drop.classList.remove('is-drag'); }));
        // Debug-Ausgabe für dich:
      drop.addEventListener('drop', e=>{
        const dbg = $('ados-scan-ocr');
        const f = e.dataTransfer && e.dataTransfer.files && e.dataTransfer.files[0];
         if(dbg){ dbg.textContent = text; }
         if (f){ fileIn.files = e.dataTransfer.files; showPreview(f); }
      });
    }


    // Klick „Erkennen & suchen“
        // 2) Suche
    runBtn.addEventListener('click', async function(ev){
         status('Suche im Wiki …');
      ev.preventDefault();
         const hits = await searchTitles(text);
      if (!(fileIn.files && fileIn.files[0])){ alert('Bitte ein Foto auswählen oder aufnehmen.'); return; }
      const f = fileIn.files[0];
      try{
        runBtn.disabled=true; runBtn.textContent='Erkenne …';
         setStatus('Erkenne Label …');
        const text  = await runOCR(f);
        setStatus('Suche im Wiki …');
        const hints = extractHints(text);
         const hits = await searchWikiSmart(hints, 12);
         renderResults(hits);
         renderResults(hits);
         setStatus('Fertig.');
         status('Fertig.');
       } catch(e){
       } catch(err){
         console.error('[LabelScan]', e);
         console.error('[LabelScan] Fehler:', err);
         setStatus('Fehler bei Erkennung/Suche. Bitte erneut versuchen.');
         status('Fehler bei Erkennung/Suche. Bitte erneut versuchen.');
       } finally {
       } finally {
         runBtn.disabled=false; runBtn.textContent='🔍 Erkennen & suchen';
         progress(null);
        run.disabled = false;
        run.textContent = old;
       }
       }
     });
     });


     // Sicherheit gegen Overlays
     console.log('[LabelScan] Gadget gebunden.');
    const wrap = byId('ados-labelscan'); if (wrap) wrap.style.position='relative';
    runBtn.style.position='relative'; runBtn.style.zIndex='9999'; runBtn.style.pointerEvents='auto';
   }
   }


  // Erstbindung + Fallbacks + Observer
   if(document.readyState === 'loading'){
   if (document.readyState === 'loading'){ document.addEventListener('DOMContentLoaded', bind); } else { bind(); }
    document.addEventListener('DOMContentLoaded', bind);
  setTimeout(bind, 250); setTimeout(bind, 1000);
  } else {
   const mo = new MutationObserver(() => { if (!BOUND) bind(); });
    bind();
  mo.observe(document.documentElement || document.body, { childList:true, subtree:true });
   }
 
})();
})();

Version vom 6. November 2025, 20:26 Uhr

/* global mw */
(function () {
  'use strict';

  // ---------- Hilfsfunktionen für UI ----------
  /**
   * Shorthand DOM lookup by element id.
   * @param {string} id - Element id to look up.
   * @returns {HTMLElement|null} Whatever document.getElementById yields for that id.
   */
  function $(id){
    const found = document.getElementById(id);
    return found;
  }
  /**
   * Writes a message into the #ados-scan-status element; does nothing when
   * that element is not on the page.
   * @param {string} [t] - Text to show; any falsy value clears the line.
   */
  function status(t){
    const target = $('ados-scan-status');
    if(!target) return;
    target.textContent = t ? t : '';
  }
  /**
   * Drives the #ados-scan-progress bar; does nothing when it is not on the page.
   * @param {?number} v - Fraction done. null/undefined hides the bar and resets
   *   it to 0; any other value shows the bar with the value clamped to 0..1.
   */
  function progress(v){
    const meter = $('ados-scan-progress');
    if(!meter) return;
    const hide = (v == null);
    meter.hidden = hide;
    meter.value = hide ? 0 : Math.min(1, Math.max(0, v));
  }
  /**
   * Shows the selected image inside #ados-scan-preview; does nothing when that
   * element is not on the page.
   *
   * The temporary blob URL is released as soon as the browser has loaded (or
   * failed to load) the image, so repeated selections do not accumulate
   * object URLs for the lifetime of the page.
   *
   * @param {Blob} file - Image file chosen by the user.
   */
  function preview(file){
    const p = $('ados-scan-preview');
    if(!p) return;
    const url = URL.createObjectURL(file);
    p.innerHTML = '<img alt="Vorschau" style="max-width:100%;height:auto;border-radius:8px" />';
    const img = p.querySelector('img');
    // An image that has finished loading stays visible after its URL is revoked.
    const release = () => URL.revokeObjectURL(url);
    img.onload = release;
    img.onerror = release;
    img.src = url;
  }

  // ---------- Tesseract sauber laden (Worker/WASM/CDN) ----------
  // Cached promise for the in-flight or completed script load (null = not started).
  let _tessReady = null;
  // Base URL of the Tesseract.js distribution files.
  const TESS_CDN = 'https://cdn.jsdelivr.net/npm/tesseract.js@5/dist/';

  /**
   * Loads tesseract.min.js from TESS_CDN exactly once.
   *
   * Concurrent and later callers share the same promise. If loading fails the
   * cache is cleared again, so the next call injects a fresh <script> tag
   * instead of returning the old rejection forever.
   *
   * @returns {Promise<void>} Resolves once window.Tesseract is available or the
   *   script has loaded; rejects with an Error when the script cannot be loaded.
   */
  async function ensureTesseract(){
    if(_tessReady) return _tessReady;

    const pending = new Promise((resolve, reject) => {
      if(window.Tesseract) return resolve();

      const s = document.createElement('script');
      s.src = TESS_CDN + 'tesseract.min.js';
      s.async = true;
      s.onload = () => resolve();
      s.onerror = () => reject(new Error('Tesseract.js konnte nicht geladen werden'));
      document.head.appendChild(s);
    });

    _tessReady = pending;
    // Forget a failed attempt so a retry can succeed; the caller still sees the rejection.
    pending.catch(() => {
      if(_tessReady === pending) _tessReady = null;
    });
    return pending;
  }

  // Kleines Canvas-Preprocessing (Grayscale & leichter Kontrast)
  /**
   * Decodes an image file and returns a canvas prepared for OCR.
   *
   * The image is drawn so that its longer side measures MAX (1800) pixels and
   * is then converted to grayscale with a slight contrast boost.
   * The blob URL used for decoding is revoked once the image has loaded or
   * failed, so it is not leaked on every scan.
   *
   * @param {Blob} file - Image file to decode.
   * @returns {Promise<HTMLCanvasElement>} Canvas holding the processed image.
   *   Rejects with the image's error event when the file cannot be decoded.
   */
  async function preprocess(file){
    const url = URL.createObjectURL(file);
    let img;
    try {
      img = await new Promise((res, rej) => {
        const i = new Image();
        i.onload = () => res(i);
        i.onerror = rej;
        i.src = url;
      });
    } finally {
      // The decoded image no longer needs its source URL.
      URL.revokeObjectURL(url);
    }

    const MAX = 1800;
    // Scale factor that maps the longer side onto MAX.
    const scale = (img.width > img.height) ? (MAX / img.width) : (MAX / img.height);
    const w = Math.round(img.width * scale);
    const h = Math.round(img.height * scale);
    const c = document.createElement('canvas');
    c.width = w; c.height = h;
    const ctx = c.getContext('2d');
    ctx.imageSmoothingEnabled = true;
    ctx.drawImage(img, 0, 0, w, h);

    const id = ctx.getImageData(0,0,w,h), d=id.data;
    for(let i=0;i<d.length;i+=4){
      // Weighted luminance of the RGB channels; alpha (d[i+3]) is left untouched.
      const g = 0.2126*d[i] + 0.7152*d[i+1] + 0.0722*d[i+2];
      const v = Math.max(0, Math.min(255, (g-128)*1.12 + 128)); // slight contrast boost around mid-gray
      d[i]=d[i+1]=d[i+2]=v;
    }
    ctx.putImageData(id,0,0);
    return c;
  }

  // ---------- OCR ----------
  /**
   * Runs OCR (English + German) on an image file and returns the recognized text.
   *
   * A fresh worker is created per call and always terminated afterwards; the
   * progress bar is reset in the same cleanup step.
   *
   * @param {Blob} file - Image file to recognize.
   * @returns {Promise<string>} Trimmed OCR text ('' when nothing was recognized).
   *   Rejects when loading Tesseract, creating the worker, preprocessing or
   *   recognition fails.
   */
  async function runOCR(file){
    await ensureTesseract();
    const { createWorker } = window.Tesseract;

    // TESS_CDN pins tesseract.js@5. In v5 createWorker takes (langs, oem, options)
    // and returns a worker that is already loaded and initialized, so the older
    // loadLanguage()/initialize() calls are dropped. oem 1 = LSTM.
    // NOTE(review): corePath/langPath are left at the library defaults; the
    // previously hard-coded dist/ locations do not appear to host the core or
    // traineddata files — confirm before pinning custom paths again.
    const worker = await createWorker('eng+deu', 1, {
      workerPath: TESS_CDN + 'worker.min.js',
      logger: m => {
        if(m && typeof m.progress === 'number'){
          progress(m.progress);
        }
      }
    });

    try {
      const canvas = await preprocess(file);

      // psm 6 = treat the image as a single uniform block of text
      await worker.setParameters({
        tessedit_pageseg_mode: '6',
        preserve_interword_spaces: '1'
      });

      const result = await worker.recognize(canvas);
      const text = (result && result.data && result.data.text) ? result.data.text : '';
      return text.trim();
    } finally {
      await worker.terminate();
      progress(null);
    }
  }

  // ---------- einfache Treffer-Suche im Wiki ----------
  /**
   * Full-text search of the main namespace using words taken from OCR output.
   *
   * Punctuation is stripped from the text, words shorter than three characters
   * are dropped and the first six remaining words are sent as quoted terms
   * (all of them must match).
   *
   * @param {string} q - Raw OCR text.
   * @returns {Promise<Array<Object>>} Items of the API's query.search list, or
   *   an empty array when no usable word was found or the reply has no list.
   */
  async function searchTitles(q){
    await mw.loader.using('mediawiki.api');
    const api = new mw.Api();

    // Keep letters, digits, whitespace, hyphen and apostrophe only.
    const cleaned = String(q || '')
      .replace(/[^\p{L}\p{N}\s\-']/gu,' ')
      .replace(/\s+/g,' ')
      .trim();

    const terms = [];
    for(const token of cleaned.split(' ')){
      if(token.length < 3) continue;
      terms.push(token);
      if(terms.length === 6) break;
    }
    if(terms.length === 0) return [];

    const response = await api.get({
      action: 'query',
      list: 'search',
      srsearch: terms.map(term => `"${term}"`).join(' '), // quoted terms are AND-combined
      srlimit: 12,
      srnamespace: 0,
      formatversion: 2
    });

    const hits = response.query && response.query.search;
    return hits ? hits : [];
  }

  /**
   * Renders search hits into #ados-scan-results, replacing previous content;
   * does nothing when that element is not on the page.
   *
   * @param {Array<{title: string, snippet: string}>} items - Search hits. An
   *   empty or missing list produces a "no clear hits" notice instead.
   */
  function renderResults(items){
    const box = $('ados-scan-results');
    if(!box) return;

    box.innerHTML = '';
    const isEmpty = !items || !items.length;
    if(isEmpty){
      box.innerHTML = '<div class="ados-hit">Keine klaren Treffer. Bitte anderes Foto oder manuell suchen.</div>';
      return;
    }

    items.forEach(hit => {
      const title = hit.title || '';
      const href  = mw.util.getUrl(title.replace(/ /g,'_'));
      // Drop the <span> highlight wrappers and restore plain double quotes.
      const meta  = String(hit.snippet || '').replace(/<\/?span[^>]*>/g,'').replace(/&quot;/g,'"');

      const row = document.createElement('div');
      row.className = 'ados-hit';
      let markup = '<b><a href="'+href+'">'+mw.html.escape(title)+'</a></b>';
      if(meta){
        markup += '<div class="meta">'+meta+'</div>';
      }
      row.innerHTML = markup;
      box.appendChild(row);
    });
  }

  // ---------- Bindings ----------
  /**
   * Wires the scan UI: the optional big button opens the file picker, a file
   * selection shows a preview, and the run button performs OCR followed by a
   * wiki search. Returns without doing anything when the run button or the
   * file input is not on the page.
   */
  function bind(){
    const run = $('ados-scan-run');
    const file= $('ados-scan-file');
    const big = $('ados-scan-bigbtn');

    if(!run || !file) return;

    function openPicker(){
      file.click();
    }

    function onFileChosen(){
      const chosen = file.files && file.files[0];
      if(chosen) preview(chosen);
    }

    async function onRunClicked(ev){
      ev.preventDefault();
      const photo = file.files && file.files[0];
      if(!photo){
        alert('Bitte zuerst ein Foto auswählen oder aufnehmen.');
        return;
      }

      // Lock the button and remember its label for the duration of the scan.
      run.disabled = true;
      const previousLabel = run.textContent;
      run.textContent = 'Erkenne …';
      status('Erkenne Label …');
      progress(0);

      try {
        // Step 1: OCR
        const text = await runOCR(photo);
        // Raw OCR output goes into the optional debug element.
        const debugBox = $('ados-scan-ocr');
        if(debugBox){
          debugBox.textContent = text;
        }

        // Step 2: search
        status('Suche im Wiki …');
        const hits = await searchTitles(text);
        renderResults(hits);
        status('Fertig.');
      } catch(err){
        console.error('[LabelScan] Fehler:', err);
        status('Fehler bei Erkennung/Suche. Bitte erneut versuchen.');
      } finally {
        progress(null);
        run.disabled = false;
        run.textContent = previousLabel;
      }
    }

    if(big){
      big.addEventListener('click', openPicker);
    }
    file.addEventListener('change', onFileChosen);
    run.addEventListener('click', onRunClicked);

    console.log('[LabelScan] Gadget gebunden.');
  }

  // Bind right away when the document has already been parsed; otherwise wait
  // for DOMContentLoaded.
  if(document.readyState !== 'loading'){
    bind();
  } else {
    document.addEventListener('DOMContentLoaded', bind);
  }
})();