Sort by Occurrences
Example
>>> # TEST PREPARATION
>>> import sys
>>> from io import StringIO
>>> from techminer2.thesaurus.user import InitializeThesaurus, SortByOccurrences
>>> # Redirecting stderr to avoid messages during doctests
>>> original_stderr = sys.stderr
>>> sys.stderr = StringIO()
>>> # Reset the thesaurus to initial state
>>> InitializeThesaurus(thesaurus_file="demo.the.txt", field="raw_descriptors",
... root_directory="examples/fintech/", quiet=True).run()
>>> # Creates, configures, an run the sorter
>>> sorter = (
... SortByOccurrences(use_colorama=False)
... .with_thesaurus_file("demo.the.txt")
... .with_field("raw_descriptors")
... .where_root_directory_is("examples/fintech/")
... )
>>> sorter.run()
>>> # Capture and print stderr output to test the code using doctest
>>> output = sys.stderr.getvalue()
>>> sys.stderr = StringIO()
>>> print(output)
Sorting thesaurus by occurrences...
File : examples/fintech/data/thesaurus/demo.the.txt
Sorting process completed successfully
Printing thesaurus header
File : examples/fintech/data/thesaurus/demo.the.txt
FINTECH
FINTECH; FINTECHS
FINANCE
FINANCE
TECHNOLOGIES
TECHNOLOGIES; TECHNOLOGY
INNOVATION
INNOVATION; INNOVATIONS
FINANCIAL_SERVICE
FINANCIAL_SERVICE; FINANCIAL_SERVICES
FINANCIAL_TECHNOLOGIES
FINANCIAL_TECHNOLOGIES; FINANCIAL_TECHNOLOGY
BANKS
BANKS
THE_DEVELOPMENT
THE_DEVELOPMENT; THE_DEVELOPMENTS