doc_curation.wikisource

Utilities for scraping texts from Wikisource.

doc_curation.wikisource.dump_deep_text(url_text_id, url_leaf_id_padding, dir_path, unit_info_file, get_collapsible_content=False, dry_run=False)
doc_curation.wikisource.dump_item(title, item_url, outfile_path, get_collapsible_content)
doc_curation.wikisource.dump_text(url_base, num_parts, dir_path, url_id_padding='%d', get_collapsible_content=False, transliterate_id=True)
doc_curation.wikisource.get_item_url_suffix(id, id_base, url_id_padding='%d', transliterate_id=True)
doc_curation.wikisource.get_wiki_path(subunit_path, unit_data, url_id_padding='%2d')