{
  "version": "1.0.0",
  "exported_at": "2026-06-02T00:00:00.000Z",
  "project": {
    "name": "Willhaben Job Scraper Details",
    "description": "Scrapes Willhaben.at job detail pages by URL, matching the Octoparse detail-page fields: Original_URL, Titel, Beschäftigungsart, Beschäftigungssituation, Startzeit_der_Beschäftigung, Arbeitsort, Erforderliche_Sprachkenntnisse, Bruttogehalt, Arbeitgeber, Gründungsjahr, Aktuelles_Job, and Firmenprofil. Navigation strategy: multi-URL detail-page loop using navigate.urls[] plus loop-continue. Replace or extend navigate-1.config.urls with the complete set of Willhaben job detail URLs to scrape. If an expired detail URL redirects to a similar-jobs search page, the workflow attempts to open the first current job detail result before extraction.",
    "color": "bg-[#4589ff]",
    "template_id": "ai-generated"
  },
  "blocks": [
    {
      "block_id": "set-window-size-1",
      "block_type": "process",
      "title": "Set Window Size",
      "description": "Set browser window dimensions",
      "position_x": 120,
      "position_y": 240,
      "config": {
        "width": 1920,
        "height": 1080,
        "color": "bg-[#4589ff]"
      }
    },
    {
      "block_id": "navigate-1",
      "block_type": "process",
      "title": "Navigate",
      "description": "Go to a URL",
      "position_x": 480,
      "position_y": 240,
      "config": {
        "urls": [
          "https://www.willhaben.at/jobs/job/kfz-lackierer-w-m-d/13158490",
          "https://www.willhaben.at/jobs/job/friseur-in-fuer-15-40-stunden/13113239"
        ],
        "color": "bg-[#4589ff]"
      }
    },
    {
      "block_id": "wait-for-page-load-1",
      "block_type": "process",
      "title": "Wait for Page Load",
      "description": "Wait for page to finish loading",
      "position_x": 840,
      "position_y": 240,
      "config": {
        "timeout": 30,
        "color": "bg-[#08bdba]"
      }
    },
    {
      "block_id": "inject-javascript-1",
      "block_type": "process",
      "title": "Inject JavaScript",
      "description": "Run custom JavaScript on the page",
      "position_x": 1200,
      "position_y": 240,
      "config": {
        "jsCode": "try { const labels = ['Accept', 'Akzeptieren', 'Alle akzeptieren', 'Zustimmen', 'Einverstanden', 'OK']; const buttons = Array.from(document.querySelectorAll('button, [role=\"button\"')); const btn = buttons.find(b => labels.some(l => (b.innerText || b.textContent || '').trim().toLowerCase().includes(l.toLowerCase()))); if (btn) btn.click(); } catch (e) {}",
        "waitForCompletion": true,
        "timeout": 5,
        "color": "bg-[#a56eff]"
      }
    },
    {
      "block_id": "sleep-1",
      "block_type": "process",
      "title": "Sleep",
      "description": "Wait for specified time",
      "position_x": 1560,
      "position_y": 240,
      "config": {
        "duration": 2,
        "color": "bg-[#08bdba]"
      }
    },
    {
      "block_id": "inject-javascript-2",
      "block_type": "process",
      "title": "Inject JavaScript",
      "description": "Run custom JavaScript on the page",
      "position_x": 1920,
      "position_y": 240,
      "config": {
        "jsCode": "try { if (!location.pathname.includes('/jobs/job/')) { const links = Array.from(document.querySelectorAll('a[href*=\"/jobs/job/\"]')); const jobLink = links.find(a => { const href = a.getAttribute('href') || ''; const text = (a.innerText || a.textContent || '').trim(); return href && text && !href.includes('similarAdvert'); }); if (jobLink) location.href = new URL(jobLink.getAttribute('href'), location.href).href; } } catch (e) {}",
        "waitForCompletion": true,
        "timeout": 5,
        "color": "bg-[#a56eff]"
      }
    },
    {
      "block_id": "wait-for-page-load-2",
      "block_type": "process",
      "title": "Wait for Page Load",
      "description": "Wait for page to finish loading",
      "position_x": 2280,
      "position_y": 240,
      "config": {
        "timeout": 30,
        "color": "bg-[#08bdba]"
      }
    },
    {
      "block_id": "sleep-2",
      "block_type": "process",
      "title": "Sleep",
      "description": "Wait for specified time",
      "position_x": 2640,
      "position_y": 240,
      "config": {
        "duration": 2,
        "color": "bg-[#08bdba]"
      }
    },
    {
      "block_id": "wait-for-element-1",
      "block_type": "process",
      "title": "Wait for Element",
      "description": "Wait until element appears",
      "position_x": 3000,
      "position_y": 240,
      "config": {
        "selector": "body",
        "timeout": 30,
        "visible": true,
        "color": "bg-[#08bdba]"
      }
    },
    {
      "block_id": "structured-export-1",
      "block_type": "process",
      "title": "Structured Export",
      "description": "Export data with custom columns",
      "position_x": 3360,
      "position_y": 240,
      "config": {
        "rowSelector": "body",
        "fileName": "willhaben_job_scraper_details.csv",
        "saveLocation": "C:\\Users\\theskd\\Documents\\UScraper\\templates",
        "includeHeaders": true,
        "fileMode": "append",
        "color": "bg-[#42be65]",
        "columns": [
          {
            "name": "Original_URL",
            "selector": "window.location.href",
            "attribute": "text",
            "isJs": true
          },
          {
            "name": "Titel",
            "selector": "(() => { const n = s => (s || '').toString().replace(/\\s+/g, ' ').trim(); const job = () => { for (const s of document.querySelectorAll('script[type=\"application/ld+json\"]')) { try { const v = JSON.parse(s.textContent); const arr = Array.isArray(v) ? v : [v]; const all = arr.concat(...arr.map(x => Array.isArray(x && x['@graph']) ? x['@graph'] : [])); for (const x of all) if (x && String(x['@type']).includes('JobPosting')) return x; } catch(e) {} } return {}; }; const j = job(); return n(j.title) || n(document.querySelector('h1')?.innerText) || n(document.title.replace(/\\s*\\|.*$/, '')); })()",
            "attribute": "text",
            "isJs": true
          },
          {
            "name": "Beschäftigungsart",
            "selector": "(() => { const n = s => (s || '').toString().replace(/\\s+/g, ' ').trim(); const job = () => { for (const s of document.querySelectorAll('script[type=\"application/ld+json\"]')) { try { const v = JSON.parse(s.textContent); const arr = Array.isArray(v) ? v : [v]; const all = arr.concat(...arr.map(x => Array.isArray(x && x['@graph']) ? x['@graph'] : [])); for (const x of all) if (x && String(x['@type']).includes('JobPosting')) return x; } catch(e) {} } return {}; }; const j = job(); const raw = Array.isArray(j.employmentType) ? j.employmentType.join(', ') : n(j.employmentType); const mapped = raw.replace(/FULL_TIME/gi, 'Vollzeit').replace(/PART_TIME/gi, 'Teilzeit').replace(/CONTRACTOR/gi, 'Freie Mitarbeit').replace(/TEMPORARY/gi, 'Befristet').replace(/INTERN/gi, 'Praktikum'); if (n(mapped)) return n(mapped); const txt = n(document.body.innerText); const low = txt.toLowerCase(); const labs = ['Beschäftigungsart', 'Anstellungsart', 'Beschäftigungsausmaß']; const stops = ['Beschäftigungssituation', 'Startzeit der Beschäftigung', 'Arbeitsort', 'Erforderliche Sprachkenntnisse', 'Bruttogehalt', 'Arbeitgeber']; for (const lab of labs) { const i = low.indexOf(lab.toLowerCase()); if (i >= 0) { let start = i + lab.length, end = txt.length; for (const stop of stops) { const j2 = low.indexOf(stop.toLowerCase(), start); if (j2 >= 0 && j2 < end) end = j2; } const v = n(txt.slice(start, end).replace(/^[:\\s-]+/, '')); if (v && v.length <= 120 && !/zurück zum Suchergebnis|Wo suchst du|seite Jobs/i.test(v)) return v; } } return ''; })()",
            "attribute": "text",
            "isJs": true
          },
          {
            "name": "Beschäftigungssituation",
            "selector": "(() => { const n = s => (s || '').toString().replace(/\\s+/g, ' ').trim(); const txt = n(document.body.innerText); const low = txt.toLowerCase(); const labs = ['Beschäftigungssituation']; const stops = ['Beschäftigungsart', 'Startzeit der Beschäftigung', 'Arbeitsort', 'Erforderliche Sprachkenntnisse', 'Bruttogehalt', 'Arbeitgeber', 'Firmenprofil']; for (const lab of labs) { const i = low.indexOf(lab.toLowerCase()); if (i >= 0) { let start = i + lab.length, end = txt.length; for (const stop of stops) { const j = low.indexOf(stop.toLowerCase(), start); if (j >= 0 && j < end) end = j; } const v = n(txt.slice(start, end).replace(/^[:\\s-]+/, '')); if (v && v.length <= 80 && !/Bruttogehalt|zurück zum Suchergebnis|seite Jobs|erforderlich/i.test(v)) return v; } } return ''; })()",
            "attribute": "text",
            "isJs": true
          },
          {
            "name": "Startzeit_der_Beschäftigung",
            "selector": "(() => { const n = s => (s || '').toString().replace(/\\s+/g, ' ').trim(); const txt = n(document.body.innerText); const low = txt.toLowerCase(); const labs = ['Startzeit der Beschäftigung', 'Dienstbeginn', 'Eintritt', 'Beginn']; const stops = ['Beschäftigungsart', 'Beschäftigungssituation', 'Arbeitsort', 'Erforderliche Sprachkenntnisse', 'Bruttogehalt', 'Arbeitgeber', 'Firmenprofil']; for (const lab of labs) { const i = low.indexOf(lab.toLowerCase()); if (i >= 0) { let start = i + lab.length, end = txt.length; for (const stop of stops) { const j = low.indexOf(stop.toLowerCase(), start); if (j >= 0 && j < end) end = j; } const v = n(txt.slice(start, end).replace(/^[:\\s-]+/, '')); if (v && v.length <= 80 && !/zurück zum Suchergebnis|seite Jobs|Wo suchst du/i.test(v)) return v; } } return ''; })()",
            "attribute": "text",
            "isJs": true
          },
          {
            "name": "Arbeitsort",
            "selector": "(() => { const n = s => (s || '').toString().replace(/\\s+/g, ' ').trim(); const job = () => { for (const s of document.querySelectorAll('script[type=\"application/ld+json\"]')) { try { const v = JSON.parse(s.textContent); const arr = Array.isArray(v) ? v : [v]; const all = arr.concat(...arr.map(x => Array.isArray(x && x['@graph']) ? x['@graph'] : [])); for (const x of all) if (x && String(x['@type']).includes('JobPosting')) return x; } catch(e) {} } return {}; }; const locs = Array.isArray(job().jobLocation) ? job().jobLocation : (job().jobLocation ? [job().jobLocation] : []); const fromJson = locs.map(l => { const a = l.address || {}; return [a.addressRegion, a.postalCode, a.addressLocality, a.streetAddress].map(n).filter(Boolean).join(', '); }).filter(Boolean).join(' | '); if (fromJson) return fromJson; const txt = n(document.body.innerText); const low = txt.toLowerCase(); const labs = ['Arbeitsort', 'Dienstort', 'Standort']; const stops = ['Beschäftigungsart', 'Beschäftigungssituation', 'Startzeit der Beschäftigung', 'Erforderliche Sprachkenntnisse', 'Bruttogehalt', 'Arbeitgeber']; for (const lab of labs) { const i = low.indexOf(lab.toLowerCase()); if (i >= 0) { let start = i + lab.length, end = txt.length; for (const stop of stops) { const j = low.indexOf(stop.toLowerCase(), start); if (j >= 0 && j < end) end = j; } const v = n(txt.slice(start, end).replace(/^[:\\s-]+/, '')); if (v && v.length <= 160 && !/Wo suchst du|zurück zum Suchergebnis|seite Jobs/i.test(v)) return v; } } return ''; })()",
            "attribute": "text",
            "isJs": true
          },
          {
            "name": "Erforderliche_Sprachkenntnisse",
            "selector": "(() => { const n = s => (s || '').toString().replace(/\\s+/g, ' ').trim(); const txt = n(document.body.innerText); const low = txt.toLowerCase(); const labs = ['Erforderliche Sprachkenntnisse', 'Sprachkenntnisse', 'Sprachen']; const stops = ['Beschäftigungsart', 'Beschäftigungssituation', 'Startzeit der Beschäftigung', 'Arbeitsort', 'Bruttogehalt', 'Arbeitgeber']; for (const lab of labs) { const i = low.indexOf(lab.toLowerCase()); if (i >= 0) { let start = i + lab.length, end = txt.length; for (const stop of stops) { const j = low.indexOf(stop.toLowerCase(), start); if (j >= 0 && j < end) end = j; } const v = n(txt.slice(start, end).replace(/^[:\\s-]+/, '')); if (v && v.length <= 120 && !/Bruttogehalt|zurück zum Suchergebnis|seite Jobs/i.test(v)) return v; } } const m = txt.match(/\\b(Deutsch|Englisch|Französisch|Italienisch|Spanisch)\\b/i); return m ? m[1] : ''; })()",
            "attribute": "text",
            "isJs": true
          },
          {
            "name": "Bruttogehalt",
            "selector": "(() => { const n = s => (s || '').toString().replace(/\\s+/g, ' ').trim(); const txt = n(document.body.innerText); const low = txt.toLowerCase(); const labs = ['Bruttogehalt', 'Gehalt', 'Mindestgehalt', 'Bezahlung', 'Entlohnung']; const stops = ['Beschäftigungsart', 'Beschäftigungssituation', 'Startzeit der Beschäftigung', 'Arbeitsort', 'Erforderliche Sprachkenntnisse', 'Arbeitgeber', 'Firmenprofil']; for (const lab of labs) { const i = low.indexOf(lab.toLowerCase()); if (i >= 0) { let start = i + lab.length, end = txt.length; for (const stop of stops) { const j = low.indexOf(stop.toLowerCase(), start); if (j >= 0 && j < end) end = j; } const v = n(txt.slice(start, end).replace(/^[:\\s-]+/, '')); if (v && v.length <= 180 && !/zurück zum Suchergebnis|seite Jobs/i.test(v)) return v; } } const job = () => { for (const s of document.querySelectorAll('script[type=\"application/ld+json\"]')) { try { const v = JSON.parse(s.textContent); const arr = Array.isArray(v) ? v : [v]; const all = arr.concat(...arr.map(x => Array.isArray(x && x['@graph']) ? x['@graph'] : [])); for (const x of all) if (x && String(x['@type']).includes('JobPosting')) return x; } catch(e) {} } return {}; }; const bs = job().baseSalary || {}; const val = bs.value || {}; return n([val.minValue || val.value, val.maxValue, bs.currency || val.currency, val.unitText].filter(Boolean).join(' ')); })()",
            "attribute": "text",
            "isJs": true
          },
          {
            "name": "Arbeitgeber",
            "selector": "(() => { const n = s => (s || '').toString().replace(/\\s+/g, ' ').trim(); const job = () => { for (const s of document.querySelectorAll('script[type=\"application/ld+json\"]')) { try { const v = JSON.parse(s.textContent); const arr = Array.isArray(v) ? v : [v]; const all = arr.concat(...arr.map(x => Array.isArray(x && x['@graph']) ? x['@graph'] : [])); for (const x of all) if (x && String(x['@type']).includes('JobPosting')) return x; } catch(e) {} } return {}; }; const org = job().hiringOrganization || {}; const fromLink = n(document.querySelector('a[href*=\"/jobs/firma/\"]')?.innerText).replace(/\\s+Jobs$/, ''); return n(org.name) || fromLink; })()",
            "attribute": "text",
            "isJs": true
          },
          {
            "name": "Gründungsjahr",
            "selector": "(() => { const n = s => (s || '').toString().replace(/\\s+/g, ' ').trim(); const txt = n(document.body.innerText); const m = txt.match(/(?:Gründungsjahr|Gegründet|Gründung)\\s*:?\\s*(\\d{4})/i); return m ? m[1] : ''; })()",
            "attribute": "text",
            "isJs": true
          },
          {
            "name": "Aktuelles_Job",
            "selector": "(() => { const n = s => (s || '').toString().replace(/\\s+/g, ' ').trim(); const a = document.querySelector('a[href*=\"/jobs/firma/\"]'); const scope = a ? (a.closest('section, article, div') || a.parentElement || document.body) : document.body; const txt = n(scope.innerText); const m = txt.match(/(\\d+)\\s*(?:aktuelle\\s*)?Jobs?/i) || n(document.body.innerText).match(/(\\d+)\\s*(?:aktuelle\\s*)?Jobs?/i); return m ? m[1] : ''; })()",
            "attribute": "text",
            "isJs": true
          },
          {
            "name": "Firmenprofil",
            "selector": "(() => { const a = Array.from(document.querySelectorAll('a[href*=\"/jobs/firma/\"]'))[0]; return a ? new URL(a.getAttribute('href'), location.href).href : ''; })()",
            "attribute": "text",
            "isJs": true
          }
        ]
      }
    },
    {
      "block_id": "loop-continue-1",
      "block_type": "process",
      "title": "Loop Continue",
      "description": "Continue multi-input loop",
      "position_x": 3720,
      "position_y": 240,
      "config": {
        "color": "bg-[#8d8d8d]"
      }
    }
  ],
  "connections": [
    {
      "from_block_id": "set-window-size-1",
      "from_connector_id": "right",
      "to_block_id": "navigate-1",
      "to_connector_id": "left"
    },
    {
      "from_block_id": "navigate-1",
      "from_connector_id": "right",
      "to_block_id": "wait-for-page-load-1",
      "to_connector_id": "left"
    },
    {
      "from_block_id": "wait-for-page-load-1",
      "from_connector_id": "right",
      "to_block_id": "inject-javascript-1",
      "to_connector_id": "left"
    },
    {
      "from_block_id": "inject-javascript-1",
      "from_connector_id": "right",
      "to_block_id": "sleep-1",
      "to_connector_id": "left"
    },
    {
      "from_block_id": "sleep-1",
      "from_connector_id": "right",
      "to_block_id": "inject-javascript-2",
      "to_connector_id": "left"
    },
    {
      "from_block_id": "inject-javascript-2",
      "from_connector_id": "right",
      "to_block_id": "wait-for-page-load-2",
      "to_connector_id": "left"
    },
    {
      "from_block_id": "wait-for-page-load-2",
      "from_connector_id": "right",
      "to_block_id": "sleep-2",
      "to_connector_id": "left"
    },
    {
      "from_block_id": "sleep-2",
      "from_connector_id": "right",
      "to_block_id": "wait-for-element-1",
      "to_connector_id": "left"
    },
    {
      "from_block_id": "wait-for-element-1",
      "from_connector_id": "right",
      "to_block_id": "structured-export-1",
      "to_connector_id": "left"
    },
    {
      "from_block_id": "structured-export-1",
      "from_connector_id": "right",
      "to_block_id": "loop-continue-1",
      "to_connector_id": "left"
    }
  ],
  "canvas_elements": [
    {
      "id": "group-entry",
      "element_type": "group",
      "title": "Entry & Setup",
      "color": "#4589ff",
      "position_x": 48,
      "position_y": 136,
      "width": 380,
      "height": 296,
      "z_index": 20,
      "data": {
        "memberBlockIds": [
          "set-window-size-1"
        ]
      }
    },
    {
      "id": "group-load",
      "element_type": "group",
      "title": "Page Load",
      "color": "#08bdba",
      "position_x": 408,
      "position_y": 136,
      "width": 2840,
      "height": 296,
      "z_index": 20,
      "data": {
        "memberBlockIds": [
          "navigate-1",
          "wait-for-page-load-1",
          "sleep-1",
          "wait-for-page-load-2",
          "sleep-2",
          "wait-for-element-1"
        ]
      }
    },
    {
      "id": "group-interaction",
      "element_type": "group",
      "title": "Interaction",
      "color": "#a56eff",
      "position_x": 1128,
      "position_y": 136,
      "width": 1040,
      "height": 296,
      "z_index": 20,
      "data": {
        "memberBlockIds": [
          "inject-javascript-1",
          "inject-javascript-2"
        ]
      }
    },
    {
      "id": "group-extract",
      "element_type": "group",
      "title": "Data Extraction",
      "color": "#42be65",
      "position_x": 3288,
      "position_y": 136,
      "width": 380,
      "height": 296,
      "z_index": 20,
      "data": {
        "memberBlockIds": [
          "structured-export-1"
        ]
      }
    },
    {
      "id": "group-pagination",
      "element_type": "group",
      "title": "Pagination Loop",
      "color": "#ff832b",
      "position_x": 3648,
      "position_y": 136,
      "width": 380,
      "height": 296,
      "z_index": 20,
      "data": {
        "memberBlockIds": [
          "loop-continue-1"
        ]
      }
    },
    {
      "id": "note-overview",
      "element_type": "note",
      "title": "Overview",
      "content": "Scrapes Willhaben.at job detail pages by URL, matching the Octoparse detail-page fields: Original_URL, Titel, Beschäftigungsart, Beschäftigungssituation, Startzeit_der_Beschäftigung, Arbeitsort, Erforderliche_Sprachkenntnisse, Bruttogehalt, Arbeitgeber, Gründungsjahr, Aktuelles_Job, and Firmenprofil. Navigation strategy: multi-URL detail-page loop using navigate.urls[] plus loop-continue. Replace or extend navigate-1.config.urls with the complete set of Willhaben job detail URLs to scrape. If an expired detail URL redirects to a similar-jobs search page, the workflow attempts to open the first current job detail result before extraction.",
      "color": "#f1c21b",
      "position_x": 80,
      "position_y": 20,
      "width": 480,
      "height": 160,
      "z_index": 22,
      "data": {}
    },
    {
      "id": "note-block-navigate-1",
      "element_type": "note",
      "title": "Note: Navigate",
      "content": "Multi-URL loop over 2 pages. Pair with loop-continue at the end of each iteration.",
      "color": "#ee5396",
      "position_x": 680,
      "position_y": 220,
      "width": 328,
      "height": 107,
      "z_index": 22,
      "data": {
        "block_id": "navigate-1"
      }
    },
    {
      "id": "note-block-inject-javascript-1",
      "element_type": "note",
      "title": "Note: Inject JavaScript",
      "content": "Runs custom JavaScript in the page: `try { const labels = ['Accept', 'Akzeptieren', 'Alle akzeptieren', 'Zustimmen', 'Einverstanden', 'OK...` Verify in browser if results are empty.",
      "color": "#ee5396",
      "position_x": 1400,
      "position_y": 220,
      "width": 340,
      "height": 140,
      "z_index": 22,
      "data": {
        "block_id": "inject-javascript-1"
      }
    },
    {
      "id": "note-block-inject-javascript-2",
      "element_type": "note",
      "title": "Note: Inject JavaScript",
      "content": "Runs custom JavaScript in the page: `try { if (!location.pathname.includes('/jobs/job/')) { const links = Array.from(document.querySelect...` Verify in browser if results are empty.",
      "color": "#ee5396",
      "position_x": 2120,
      "position_y": 220,
      "width": 340,
      "height": 140,
      "z_index": 22,
      "data": {
        "block_id": "inject-javascript-2"
      }
    },
    {
      "id": "note-block-structured-export-1",
      "element_type": "note",
      "title": "Note: Structured Export",
      "content": "Structured export with JS columns (Original_URL, Titel, Beschäftigungsart, Beschäftigungssituation, Startzeit_der_Beschäftigung). These selectors are fragile — update if the site layout changes.",
      "color": "#ee5396",
      "position_x": 3560,
      "position_y": 220,
      "width": 340,
      "height": 144,
      "z_index": 22,
      "data": {
        "block_id": "structured-export-1"
      }
    },
    {
      "id": "note-block-loop-continue-1",
      "element_type": "note",
      "title": "Note: Loop Continue",
      "content": "Loop Continue advances a multi-URL or multi-text loop. Place at the end of the loop body with a clear back-edge to the loop start.",
      "color": "#ee5396",
      "position_x": 3920,
      "position_y": 220,
      "width": 340,
      "height": 123,
      "z_index": 22,
      "data": {
        "block_id": "loop-continue-1"
      }
    }
  ]
}