Coverage report: 67%

Files Functions Classes

coverage.py v7.6.4, created at 2024-11-20 09:03 +0000

File function statements missing excluded branches partial coverage
src/crawler/augment.py augment_article 9 9 0 8 0 0%
src/crawler/augment.py update_article 29 29 0 14 0 0%
src/crawler/augment.py fetch_article_data 18 18 0 10 0 0%
src/crawler/augment.py (no function) 8 8 0 0 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.__init__ 21 21 0 0 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.parse_collection_content 1 1 0 0 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.parse_issue_content 0 0 0 0 0 100%
src/crawler/base_crawler.py BaseCollectionCrawler.parse_article_content 1 1 0 0 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.crawl_collection 20 20 0 10 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.crawl_collection.iterate_xissues 7 7 0 4 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.crawl_issue 20 20 0 16 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.crawl_one_issue_url 13 13 0 8 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.crawl_article 15 2 0 6 2 81%
src/crawler/base_crawler.py BaseCollectionCrawler.process_article_metadata 15 0 0 6 0 100%
src/crawler/base_crawler.py BaseCollectionCrawler.download_file 22 5 0 10 3 75%
src/crawler/base_crawler.py BaseCollectionCrawler.decode_response 1 0 0 0 0 100%
src/crawler/base_crawler.py BaseCollectionCrawler.get_page_content 5 0 0 0 0 100%
src/crawler/base_crawler.py BaseCollectionCrawler.get_page_content.set_progress_bar_title 7 5 0 6 1 23%
src/crawler/base_crawler.py BaseCollectionCrawler.get_or_create_source 6 6 0 0 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.get_or_create_periode 10 10 0 6 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.merge_xissues 48 48 0 26 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.add_xissue_into_database 16 16 0 2 0 0%
src/crawler/base_crawler.py BaseCollectionCrawler.get_metadata_using_citation_meta 85 12 0 68 16 78%
src/crawler/base_crawler.py BaseCollectionCrawler.create_crawled_bibitem 13 1 0 6 2 84%
src/crawler/base_crawler.py BaseCollectionCrawler.create_bibliography 13 0 0 4 0 100%
src/crawler/base_crawler.py add_pdf_link_to_xarticle 4 0 0 0 0 100%
src/crawler/base_crawler.py (no function) 50 0 0 0 0 100%
src/crawler/by_source/amc_crawler.py AmcCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/amc_crawler.py AmcCrawler.parse_collection_content 6 0 0 0 0 100%
src/crawler/by_source/amc_crawler.py AmcCrawler.parse_one_issues_page 21 0 0 6 0 100%
src/crawler/by_source/amc_crawler.py AmcCrawler.parse_issue_content 26 6 0 14 4 70%
src/crawler/by_source/amc_crawler.py AmcCrawler.parse_article_content 49 2 0 30 13 81%
src/crawler/by_source/amc_crawler.py (no function) 14 0 0 0 0 100%
src/crawler/by_source/amp_crawler.py AmpCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/amp_crawler.py AmpCrawler.parse_collection_content 11 0 0 6 1 94%
src/crawler/by_source/amp_crawler.py AmpCrawler.create_xissue 26 0 0 8 0 100%
src/crawler/by_source/amp_crawler.py AmpCrawler.parse_issue_content 10 0 0 4 1 93%
src/crawler/by_source/amp_crawler.py AmpCrawler.parse_article_content 31 0 0 18 6 88%
src/crawler/by_source/amp_crawler.py (no function) 16 0 0 0 0 100%
src/crawler/by_source/arsia_crawler.py ArsiaCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/arsia_crawler.py ArsiaCrawler.parse_collection_content 15 0 0 4 0 100%
src/crawler/by_source/arsia_crawler.py (no function) 11 0 0 0 0 100%
src/crawler/by_source/bdim_crawler.py BdimCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/bdim_crawler.py BdimCrawler.parse_collection_content 18 0 0 4 1 95%
src/crawler/by_source/bdim_crawler.py BdimCrawler.get_year 3 1 0 2 1 60%
src/crawler/by_source/bdim_crawler.py BdimCrawler.create_xissue 9 0 0 0 0 100%
src/crawler/by_source/bdim_crawler.py BdimCrawler.parse_issue_content 10 0 0 4 1 93%
src/crawler/by_source/bdim_crawler.py BdimCrawler.parse_article_content 92 2 0 52 13 90%
src/crawler/by_source/bdim_crawler.py BdimCrawler.parse_bibitem_tag 39 2 0 26 3 92%
src/crawler/by_source/bdim_crawler.py BdimCrawler.parse_a_tag 14 2 0 8 2 82%
src/crawler/by_source/bdim_crawler.py BdimCrawler.parse_biblio_author_tag 22 2 0 12 3 85%
src/crawler/by_source/bdim_crawler.py (no function) 32 0 0 0 0 100%
src/crawler/by_source/da_crawler.py DaCrawler.__init__ 5 5 0 0 0 0%
src/crawler/by_source/da_crawler.py DaCrawler.parse_collection_content 15 15 0 4 0 0%
src/crawler/by_source/da_crawler.py DaCrawler.parse_article_content 18 3 0 6 3 75%
src/crawler/by_source/da_crawler.py (no function) 13 0 0 0 0 100%
src/crawler/by_source/dmlcz_crawler.py DmlczCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/dmlcz_crawler.py DmlczCrawler.parse_collection_content 29 0 0 14 5 88%
src/crawler/by_source/dmlcz_crawler.py DmlczCrawler.get_year 3 1 0 2 1 60%
src/crawler/by_source/dmlcz_crawler.py DmlczCrawler.create_xissue 13 2 0 0 0 85%
src/crawler/by_source/dmlcz_crawler.py DmlczCrawler.parse_issue_content 13 0 0 6 2 89%
src/crawler/by_source/dmlcz_crawler.py DmlczCrawler.parse_article_content 53 11 0 26 11 72%
src/crawler/by_source/dmlcz_crawler.py (no function) 19 0 0 0 0 100%
src/crawler/by_source/elibm_crawler.py ElibmCrawler.__init__ 5 5 0 2 0 0%
src/crawler/by_source/elibm_crawler.py ElibmCrawler.parse_collection_content 18 1 0 10 3 86%
src/crawler/by_source/elibm_crawler.py ElibmCrawler.get_first_year 3 1 0 2 1 60%
src/crawler/by_source/elibm_crawler.py ElibmCrawler.create_xissue 23 7 0 4 2 67%
src/crawler/by_source/elibm_crawler.py ElibmCrawler.parse_issue_content 19 7 0 10 3 59%
src/crawler/by_source/elibm_crawler.py ElibmCrawler.parse_article_content 74 9 0 38 9 82%
src/crawler/by_source/elibm_crawler.py (no function) 17 0 0 0 0 100%
src/crawler/by_source/eudml_crawler.py EudmlCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/eudml_crawler.py EudmlCrawler.parse_collection_content 71 19 0 36 7 70%
src/crawler/by_source/eudml_crawler.py EudmlCrawler.create_xissue 15 0 0 6 0 100%
src/crawler/by_source/eudml_crawler.py EudmlCrawler.parse_article_content 106 77 0 50 14 28%
src/crawler/by_source/eudml_crawler.py EudmlCrawler.parse_bibtex 51 51 0 34 0 0%
src/crawler/by_source/eudml_crawler.py EudmlCrawler.get_page_content 7 0 0 2 0 100%
src/crawler/by_source/eudml_crawler.py EudmlCrawler.get_page_content.set_progress_bar_title 3 1 0 2 1 60%
src/crawler/by_source/eudml_crawler.py EudmlCrawler.download_file_dynamic 22 22 0 10 0 0%
src/crawler/by_source/eudml_crawler.py (no function) 24 0 0 0 0 100%
src/crawler/by_source/hdml_crawler.py HdmlCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/hdml_crawler.py HdmlCrawler.parse_collection_content 13 0 0 4 1 94%
src/crawler/by_source/hdml_crawler.py HdmlCrawler.crawl_one_issue_url 3 3 0 0 0 0%
src/crawler/by_source/hdml_crawler.py HdmlCrawler.create_xissue 15 0 0 6 3 86%
src/crawler/by_source/hdml_crawler.py HdmlCrawler.parse_issue_content 12 0 0 4 1 94%
src/crawler/by_source/hdml_crawler.py HdmlCrawler.parse_article_content 39 5 0 12 5 80%
src/crawler/by_source/hdml_crawler.py (no function) 24 0 0 0 0 100%
src/crawler/by_source/impan_crawler.py ImpanCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/impan_crawler.py ImpanCrawler.parse_collection_content 34 8 0 22 7 73%
src/crawler/by_source/impan_crawler.py ImpanCrawler.create_xissue 15 3 0 4 2 74%
src/crawler/by_source/impan_crawler.py ImpanCrawler.parse_issue_content 18 4 0 10 4 71%
src/crawler/by_source/impan_crawler.py ImpanCrawler.parse_article_content 31 6 0 16 8 70%
src/crawler/by_source/impan_crawler.py (no function) 19 0 0 0 0 100%
src/crawler/by_source/nsjom/nsjom_1971_crawler.py parse_collection_content 12 3 0 2 0 79%
src/crawler/by_source/nsjom/nsjom_1971_crawler.py parse_issue_content 1 0 0 0 0 100%
src/crawler/by_source/nsjom/nsjom_1971_crawler.py parse_year 10 1 0 4 1 86%
src/crawler/by_source/nsjom/nsjom_1971_crawler.py parse_issue_tag 29 6 0 12 3 78%
src/crawler/by_source/nsjom/nsjom_1971_crawler.py parse_article_tag 31 3 0 14 4 84%
src/crawler/by_source/nsjom/nsjom_1971_crawler.py (no function) 15 1 0 2 1 88%
src/crawler/by_source/nsjom/nsjom_2010_crawler.py parse_collection_content 8 0 0 2 0 100%
src/crawler/by_source/nsjom/nsjom_2010_crawler.py is_heading 12 3 0 10 1 73%
src/crawler/by_source/nsjom/nsjom_2010_crawler.py parse_issue_content 1 1 0 0 0 0%
src/crawler/by_source/nsjom/nsjom_2010_crawler.py parse_year 18 1 0 10 1 93%
src/crawler/by_source/nsjom/nsjom_2010_crawler.py parse_issue_tags 31 6 0 16 7 72%
src/crawler/by_source/nsjom/nsjom_2010_crawler.py parse_article 24 4 0 10 4 76%
src/crawler/by_source/nsjom/nsjom_2010_crawler.py (no function) 16 1 0 2 1 89%
src/crawler/by_source/nsjom/nsjom_xml_crawler.py parse_collection_content 33 3 0 16 3 88%
src/crawler/by_source/nsjom/nsjom_xml_crawler.py parse_issue_content 1 0 0 0 0 100%
src/crawler/by_source/nsjom/nsjom_xml_crawler.py parse_issue_tag 3 0 0 0 0 100%
src/crawler/by_source/nsjom/nsjom_xml_crawler.py parse_article 68 4 0 38 13 84%
src/crawler/by_source/nsjom/nsjom_xml_crawler.py (no function) 12 1 0 2 1 86%
src/crawler/by_source/nsjom_crawler.py NsjomCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/nsjom_crawler.py NsjomCrawler.parse_collection_content 4 0 0 2 0 100%
src/crawler/by_source/nsjom_crawler.py NsjomCrawler.parse_issue_content 5 1 0 4 1 78%
src/crawler/by_source/nsjom_crawler.py NsjomCrawler.decode_response 12 10 0 0 0 17%
src/crawler/by_source/nsjom_crawler.py (no function) 21 0 0 0 0 100%
src/crawler/by_source/numdam_crawler.py NumdamCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/numdam_crawler.py NumdamCrawler.crawl_collection 1 1 0 0 0 0%
src/crawler/by_source/numdam_crawler.py (no function) 9 9 0 0 0 0%
src/crawler/by_source/sasa_crawler.py SasaCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/sasa_crawler.py SasaCrawler.parse_collection_content 32 6 0 20 7 75%
src/crawler/by_source/sasa_crawler.py SasaCrawler.create_xissue 11 1 0 4 1 87%
src/crawler/by_source/sasa_crawler.py SasaCrawler.parse_issue_content 21 4 0 12 4 76%
src/crawler/by_source/sasa_crawler.py SasaCrawler.parse_sasa_article 71 4 0 40 10 87%
src/crawler/by_source/sasa_crawler.py SasaCrawler.fetch_sasa_abstract 8 1 0 2 1 80%
src/crawler/by_source/sasa_crawler.py SasaCrawler.decode_response 8 6 0 0 0 25%
src/crawler/by_source/sasa_crawler.py (no function) 18 0 0 0 0 100%
src/crawler/by_source/tac_crawler.py TacCrawler.__init__ 3 3 0 0 0 0%
src/crawler/by_source/tac_crawler.py TacCrawler.parse_collection_content 32 0 0 14 0 100%
src/crawler/by_source/tac_crawler.py TacCrawler.create_xissue 29 0 0 8 0 100%
src/crawler/by_source/tac_crawler.py TacCrawler.parse_article_content 58 2 0 28 5 92%
src/crawler/by_source/tac_crawler.py TacCrawler.insert_kwd 10 0 0 4 0 100%
src/crawler/by_source/tac_crawler.py (no function) 16 0 0 0 0 100%
src/crawler/crawler_types.py (no function) 12 0 0 0 0 100%
src/crawler/factory.py crawler_factory 4 4 0 0 0 0%
src/crawler/factory.py (no function) 15 15 0 0 0 0%
src/crawler/models.py SourceManager.get_by_natural_key 1 1 0 0 0 0%
src/crawler/models.py Source.natural_key 1 1 0 0 0 0%
src/crawler/models.py Source.__str__ 1 1 0 0 0 0%
src/crawler/models.py PeriodeManager.get_by_natural_key 1 1 0 0 0 0%
src/crawler/models.py Periode.natural_key 1 1 0 0 0 0%
src/crawler/models.py Periode.__str__ 1 1 0 0 0 0%
src/crawler/models.py (no function) 38 0 0 0 0 100%
src/crawler/utils.py insert_crawl_event_in_history 7 7 0 2 0 0%
src/crawler/utils.py get_cached_html_folder 5 5 0 2 0 0%
src/crawler/utils.py col_has_source 1 1 0 0 0 0%
src/crawler/utils.py get_cols_by_source 2 2 0 0 0 0%
src/crawler/utils.py get_all_cols 2 2 0 0 0 0%
src/crawler/utils.py read_json 2 2 0 0 0 0%
src/crawler/utils.py get_numdam_collections 8 8 0 4 0 0%
src/crawler/utils.py get_or_create_collection 26 26 0 12 0 0%
src/crawler/utils.py cleanup_str 2 0 0 0 0 100%
src/crawler/utils.py (no function) 25 0 0 0 0 100%
src/crawler/zbmath.py zbmath_request_article 49 49 0 20 0 0%
src/crawler/zbmath.py (no function) 8 8 0 0 0 0%
Total   2733 789 0 1068 235 67%

No items found using the specified filter.