{"id":"7c090529-fbfe-4f4d-82d7-508eab83af69","shortId":"VCGgBg","kind":"skill","title":"Scrapy Pipeline Data Extractor","tagline":"Builds production Scrapy spiders with custom Item Pipelines for data cleaning and storage. Uses scrapy.linkextractors.LinkExtractor for crawl scoping and ItemLoader with MapCompose processors for field normalization.","description":"# Scrapy Pipeline Data Extractor\n\nBuilds production Scrapy spiders with custom Item Pipelines for data cleaning and storage. Uses scrapy.linkextractors.LinkExtractor for crawl scoping and ItemLoader with MapCompose processors for field normalization.\n\n## Installation\n\nUse the upstream install or setup path that matches your environment:\n- pip install scrapy\n\nRequirements and caveats from upstream:\n- :alt: Supported Python Versions\n- It is cross-platform, and requires Python 3.10+. It is maintained by Zyte_\n\nBasic usage or getting-started notes:\n- .. code:: bash\n- And follow the documentation_ to learn how to use it.\n- .. _documentation: https://docs.scrapy.org/en/latest/\n\n- Source: https://github.com/scrapy/scrapy\n- Extracted from upstream docs: https://raw.githubusercontent.com/scrapy/scrapy/HEAD/README.rst\n\n## Source\n\n- [Agent Skill Exchange](https://agentskillexchange.com/skills/scrapy-pipeline-data-extractor/)","tags":["scrapy","pipeline","data","extractor","skills","agentskillexchange","agent-skills","ai-agents","ai-tools","awesome-list","claude-code","codex"],"capabilities":["skill","source-agentskillexchange","skill-scrapy-pipeline-data-extractor","topic-agent-skills","topic-ai-agents","topic-ai-tools","topic-awesome-list","topic-claude-code","topic-codex","topic-cursor","topic-llm","topic-mcp","topic-npx-skills","topic-openclaw","topic-skills-catalog"],"categories":["skills"],"synonyms":[],"warnings":[],"endpointUrl":"https://skills.sh/agentskillexchange/skills/scrapy-pipeline-data-extractor","protocol":"skill","transport":"skills-sh","auth":{"type":"none","details":{"cli":"npx skills add agentskillexchange/skills","source_repo":"https://github.com/agentskillexchange/skills","install_from":"skills.sh"}},"qualityScore":"0.454","qualityRationale":"deterministic score 0.45 from registry signals: · indexed on github topic:agent-skills · 8 github stars · SKILL.md body (927 chars)","verified":false,"liveness":"unknown","lastLivenessCheck":null,"agentReviews":{"count":0,"score_avg":null,"cost_usd_avg":null,"success_rate":null,"latency_p50_ms":null,"narrative_summary":null,"summary_updated_at":null},"enrichmentModel":"deterministic:skill-github:v1","enrichmentVersion":1,"enrichedAt":"2026-05-18T19:12:20.219Z","embedding":null,"createdAt":"2026-05-18T13:19:12.021Z","updatedAt":"2026-05-18T19:12:20.219Z","lastSeenAt":"2026-05-18T19:12:20.219Z","tsv":"'/en/latest/':121 '/scrapy/scrapy':125 '/scrapy/scrapy/head/readme.rst':132 '/skills/scrapy-pipeline-data-extractor/)':139 '3.10':93 'agent':134 'agentskillexchange.com':138 'agentskillexchange.com/skills/scrapy-pipeline-data-extractor/)':137 'alt':81 'bash':107 'basic':99 'build':5,35 'caveat':78 'clean':15,45 'code':106 'crawl':21,51 'cross':88 'cross-platform':87 'custom':10,40 'data':3,14,33,44 'doc':129 'docs.scrapy.org':120 'docs.scrapy.org/en/latest/':119 'document':111,118 'environ':72 'exchang':136 'extract':126 'extractor':4,34 'field':29,59 'follow':109 'get':103 'getting-start':102 'github.com':124 'github.com/scrapy/scrapy':123 'instal':61,65,74 'item':11,41 'itemload':24,54 'learn':113 'maintain':96 'mapcompos':26,56 'match':70 'normal':30,60 'note':105 'path':68 'pip':73 'pipelin':2,12,32,42 'platform':89 'processor':27,57 'product':6,36 'python':83,92 'raw.githubusercontent.com':131 'raw.githubusercontent.com/scrapy/scrapy/head/readme.rst':130 'requir':76,91 'scope':22,52 'scrapi':1,7,31,37,75 'scrapy.linkextractors.linkextractor':19,49 'setup':67 'skill':135 'skill-scrapy-pipeline-data-extractor' 'sourc':122,133 'source-agentskillexchange' 'spider':8,38 'start':104 'storag':17,47 'support':82 'topic-agent-skills' 'topic-ai-agents' 'topic-ai-tools' 'topic-awesome-list' 'topic-claude-code' 'topic-codex' 'topic-cursor' 'topic-llm' 'topic-mcp' 'topic-npx-skills' 'topic-openclaw' 'topic-skills-catalog' 'upstream':64,80,128 'usag':100 'use':18,48,62,116 'version':84 'zyte':98","prices":[{"id":"db193d06-85ab-42f4-bda2-55bbad7159a4","listingId":"7c090529-fbfe-4f4d-82d7-508eab83af69","amountUsd":"0","unit":"free","nativeCurrency":null,"nativeAmount":null,"chain":null,"payTo":null,"paymentMethod":"skill-free","isPrimary":true,"details":{"org":"agentskillexchange","category":"skills","install_from":"skills.sh"},"createdAt":"2026-05-18T13:19:12.021Z"}],"sources":[{"listingId":"7c090529-fbfe-4f4d-82d7-508eab83af69","source":"github","sourceId":"agentskillexchange/skills/scrapy-pipeline-data-extractor","sourceUrl":"https://github.com/agentskillexchange/skills/tree/main/skills/scrapy-pipeline-data-extractor","isPrimary":false,"firstSeenAt":"2026-05-18T13:19:12.021Z","lastSeenAt":"2026-05-18T19:12:20.219Z"}],"details":{"listingId":"7c090529-fbfe-4f4d-82d7-508eab83af69","quickStartSnippet":null,"exampleRequest":null,"exampleResponse":null,"schema":null,"openapiUrl":null,"agentsTxtUrl":null,"citations":[],"useCases":[],"bestFor":[],"notFor":[],"kindDetails":{"org":"agentskillexchange","slug":"scrapy-pipeline-data-extractor","github":{"repo":"agentskillexchange/skills","stars":8,"topics":["agent-skills","ai-agents","ai-tools","awesome-list","claude-code","codex","cursor","llm","mcp","npx-skills","openclaw","skills-catalog"],"license":"mit","html_url":"https://github.com/agentskillexchange/skills","pushed_at":"2026-05-18T19:02:17Z","description":"The open catalog of AI agent skills — 2,000+ security-scanned skills for Claude Code, Cursor, Codex, and more.","skill_md_sha":"e1a43bc7b7ffcf6904afc01569db7554774e5a9f","skill_md_path":"skills/scrapy-pipeline-data-extractor/SKILL.md","default_branch":"main","skill_tree_url":"https://github.com/agentskillexchange/skills/tree/main/skills/scrapy-pipeline-data-extractor"},"layout":"multi","source":"github","category":"skills","frontmatter":{"name":"Scrapy Pipeline Data Extractor","description":"Builds production Scrapy spiders with custom Item Pipelines for data cleaning and storage. Uses scrapy.linkextractors.LinkExtractor for crawl scoping and ItemLoader with MapCompose processors for field normalization."},"skills_sh_url":"https://skills.sh/agentskillexchange/skills/scrapy-pipeline-data-extractor"},"updatedAt":"2026-05-18T19:12:20.219Z"}}