Summary Sheet
Example
>>> from techminer2.database.tools import SummarySheet
>>> df = (
... SummarySheet()
... #
... .where_root_directory_is("examples/fintech/")
... .where_database_is("main")
... .where_record_years_range_is(None, None)
... .where_record_citations_range_is(None, None)
... #
... .run()
... )
>>> print(df.to_string(index=True))
column number of records coverage (%)
0 abbr_source_title 50 100.00%
1 abstract 48 96.00%
2 abstract_nouns_and_phrases 48 96.00%
3 affiliations 49 98.00%
4 author_full_names 50 100.00%
5 author_keywords 38 76.00%
6 authors 50 100.00%
7 authors_id 50 100.00%
8 authors_with_affiliations 49 98.00%
9 coden 12 24.00%
10 conference_code 3 6.00%
11 conference_date 3 6.00%
12 conference_location 3 6.00%
13 conference_name 3 6.00%
14 correspondence_address 34 68.00%
15 countries 49 98.00%
16 country_1st_author 49 98.00%
17 db_cited_by 50 100.00%
18 db_main 50 100.00%
19 db_references 50 100.00%
20 descriptors 50 100.00%
21 document_title 50 100.00%
22 document_title_nouns_and_phrases 50 100.00%
23 document_type 50 100.00%
24 doi 45 90.00%
25 editors 2 4.00%
26 eid 50 100.00%
27 funding_details 17 34.00%
28 funding_texts 17 34.00%
29 global_citations 50 100.00%
30 global_references 19 38.00%
31 index_keywords 19 38.00%
32 isbn 3 6.00%
33 issn 48 96.00%
34 issue 39 78.00%
35 keywords 42 84.00%
36 language 50 100.00%
37 link 50 100.00%
38 local_citations 50 100.00%
39 local_references 19 38.00%
40 nouns_and_phrases 50 100.00%
41 num_authors 50 100.00%
42 open_access 25 50.00%
43 organization_1st_author 49 98.00%
44 organizations 49 98.00%
45 page_count 43 86.00%
46 page_end 43 86.00%
47 page_start 43 86.00%
48 publication_stage 50 100.00%
49 publisher 50 100.00%
50 raw_abstract 50 100.00%
51 raw_abstract_nouns_and_phrases 48 96.00%
52 raw_abstract_spacy_phrases 0 0.00%
53 raw_author_keywords 38 76.00%
54 raw_authors 50 100.00%
55 raw_authors_id 50 100.00%
56 raw_descriptors 50 100.00%
57 raw_document_title 50 100.00%
58 raw_document_title_nouns_and_phrases 50 100.00%
59 raw_document_type 50 100.00%
60 raw_global_references 49 98.00%
61 raw_index_keywords 19 38.00%
62 raw_keywords 42 84.00%
63 raw_nouns_and_phrases 50 100.00%
64 raw_source_title 50 100.00%
65 raw_spacy_phrases 50 100.00%
66 raw_textblob_phrases 49 98.00%
67 record_id 50 100.00%
68 record_no 50 100.00%
69 regions 49 98.00%
70 scopus_art_no 6 12.00%
71 source 50 100.00%
72 source_title 50 100.00%
73 sponsors 1 2.00%
74 subject_areas 47 94.00%
75 subregions 49 98.00%
76 tokenized_abstract 48 96.00%
77 tokenized_document_title 50 100.00%
78 volume 48 96.00%
79 year 50 100.00%