diff --git a/build/doctrees/environment.pickle b/build/doctrees/environment.pickle index 54726c44..af4fa9ce 100644 Binary files a/build/doctrees/environment.pickle and b/build/doctrees/environment.pickle differ diff --git a/build/doctrees/faq_link.doctree b/build/doctrees/faq_link.doctree index 8778afff..eb96cf91 100644 Binary files a/build/doctrees/faq_link.doctree and b/build/doctrees/faq_link.doctree differ diff --git a/build/doctrees/notebooks/DemoNotebook_ammico.doctree b/build/doctrees/notebooks/DemoNotebook_ammico.doctree index c996ee8a..e55111dd 100644 Binary files a/build/doctrees/notebooks/DemoNotebook_ammico.doctree and b/build/doctrees/notebooks/DemoNotebook_ammico.doctree differ diff --git a/build/doctrees/readme_link.doctree b/build/doctrees/readme_link.doctree index 4f0116b6..2050e025 100644 Binary files a/build/doctrees/readme_link.doctree and b/build/doctrees/readme_link.doctree differ diff --git a/build/html/.buildinfo b/build/html/.buildinfo index 52166454..ebf1f6bc 100644 --- a/build/html/.buildinfo +++ b/build/html/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: cfb548d3f0892cdaa09a4601a129febf +config: 9487e2edbbf95a60cd8fdb622afe617f tags: 645f666f9bcd5a90fca523b33c5a78b7 diff --git a/build/html/_static/documentation_options.js b/build/html/_static/documentation_options.js index d1f22919..033e08ef 100644 --- a/build/html/_static/documentation_options.js +++ b/build/html/_static/documentation_options.js @@ -1,5 +1,5 @@ const DOCUMENTATION_OPTIONS = { - VERSION: '0.0.1', + VERSION: '0.2.2', LANGUAGE: 'en', COLLAPSE_INDEX: false, BUILDER: 'html', diff --git a/build/html/ammico.html b/build/html/ammico.html index 9be207b0..433ccf61 100644 --- a/build/html/ammico.html +++ b/build/html/ammico.html @@ -6,14 +6,14 @@ - text module — AMMICO 0.0.1 documentation + text module — AMMICO 0.2.2 documentation - + @@ -228,7 +228,7 @@
  • - Edit on GitHub + Edit on GitHub

  • diff --git a/build/html/create_API_key_link.html b/build/html/create_API_key_link.html index e782159f..6bef995b 100644 --- a/build/html/create_API_key_link.html +++ b/build/html/create_API_key_link.html @@ -6,14 +6,14 @@ - Instructions how to generate and enable a google Cloud Vision API key — AMMICO 0.0.1 documentation + Instructions how to generate and enable a google Cloud Vision API key — AMMICO 0.2.2 documentation - + @@ -73,7 +73,7 @@
  • - Edit on GitHub + Edit on GitHub

  • diff --git a/build/html/faq_link.html b/build/html/faq_link.html index ed37d838..267809c0 100644 --- a/build/html/faq_link.html +++ b/build/html/faq_link.html @@ -6,14 +6,14 @@ - FAQ — AMMICO 0.0.1 documentation + FAQ — AMMICO 0.2.2 documentation - + @@ -87,7 +87,7 @@
  • - Edit on GitHub + Edit on GitHub

  • @@ -200,9 +200,9 @@

    What happens if I don’t have internet access - can I still use ammico?

    Why don’t I get probabilistic assessments of age, gender and race when running the Emotion Detector?

    Due to well documented biases in the detection of minorities with computer vision tools, and to the ethical implications of such detection, these parts of the tool are not directly made available to users. To access these capabilities, users must first agree with a ethical disclosure statement that reads:

    -

    “DeepFace and RetinaFace provide wrappers to trained models in face recognition and emotion detection. Age, gender and race/ethnicity models were trained on the backbone of VGG-Face with transfer learning. -ETHICAL DISCLOSURE STATEMENT: -The Emotion Detector uses DeepFace and RetinaFace to probabilistically assess the gender, age and race of the detected faces. Such assessments may not reflect how the individuals identify. Additionally, the classification is carried out in simplistic categories and contains only the most basic classes (for example, “male” and “female” for gender, and seven non-overlapping categories for ethnicity). To access these probabilistic assessments, you must therefore agree with the following statement: “I understand the ethical and privacy implications such assessments have for the interpretation of the results and that this analysis may result in personal and possibly sensitive data, and I wish to proceed.”

    +

    “DeepFace and RetinaFace provide wrappers to trained models in face recognition and emotion detection. Age, gender and race/ethnicity models were trained on the backbone of VGG-Face with transfer learning.

    +

    ETHICAL DISCLOSURE STATEMENT:

    +

    The Emotion Detector uses DeepFace and RetinaFace to probabilistically assess the gender, age and race of the detected faces. Such assessments may not reflect how the individuals identify. Additionally, the classification is carried out in simplistic categories and contains only the most basic classes (for example, “male” and “female” for gender, and seven non-overlapping categories for ethnicity). To access these probabilistic assessments, you must therefore agree with the following statement: “I understand the ethical and privacy implications such assessments have for the interpretation of the results and that this analysis may result in personal and possibly sensitive data, and I wish to proceed.”

    This disclosure statement is included as a separate line of code early in the flow of the Emotion Detector. Once the user has agreed with the statement, further data analyses will also include these assessments.

    diff --git a/build/html/genindex.html b/build/html/genindex.html index 6ce85806..8a0c17b8 100644 --- a/build/html/genindex.html +++ b/build/html/genindex.html @@ -5,14 +5,14 @@ - Index — AMMICO 0.0.1 documentation + Index — AMMICO 0.2.2 documentation - + @@ -70,7 +70,7 @@
  • - Edit on GitHub + Edit on GitHub

  • diff --git a/build/html/index.html b/build/html/index.html index f7c8eba4..047b0981 100644 --- a/build/html/index.html +++ b/build/html/index.html @@ -6,14 +6,14 @@ - Welcome to AMMICO’s documentation! — AMMICO 0.0.1 documentation + Welcome to AMMICO’s documentation! — AMMICO 0.2.2 documentation - + @@ -74,7 +74,7 @@
  • - Edit on GitHub + Edit on GitHub

  • diff --git a/build/html/license_link.html b/build/html/license_link.html index b0a73e2b..8842259c 100644 --- a/build/html/license_link.html +++ b/build/html/license_link.html @@ -6,14 +6,14 @@ - License — AMMICO 0.0.1 documentation + License — AMMICO 0.2.2 documentation - + @@ -72,7 +72,7 @@
  • - Edit on GitHub + Edit on GitHub

  • diff --git a/build/html/modules.html b/build/html/modules.html index fbb1c141..1bb3125e 100644 --- a/build/html/modules.html +++ b/build/html/modules.html @@ -6,14 +6,14 @@ - AMMICO package modules — AMMICO 0.0.1 documentation + AMMICO package modules — AMMICO 0.2.2 documentation - + @@ -83,7 +83,7 @@
  • - Edit on GitHub + Edit on GitHub

  • diff --git a/build/html/notebooks/DemoNotebook_ammico.html b/build/html/notebooks/DemoNotebook_ammico.html index d0782cd4..8fe40b6a 100644 --- a/build/html/notebooks/DemoNotebook_ammico.html +++ b/build/html/notebooks/DemoNotebook_ammico.html @@ -6,7 +6,7 @@ - AMMICO Demonstration Notebook — AMMICO 0.0.1 documentation + AMMICO Demonstration Notebook — AMMICO 0.2.2 documentation @@ -14,7 +14,7 @@ - + @@ -106,7 +106,7 @@
  • - Edit on GitHub + Edit on GitHub

  • @@ -523,7 +523,7 @@

    Read in a csv file containing text and translating/analysing the text

    The detector modules

    The different detector modules with their options are explained in more detail in this section. ## Text detector Text on the images can be extracted using the TextDetector class (text module). The text is initally extracted using the Google Cloud Vision API and then translated into English with googletrans. The translated text is cleaned of whitespace, linebreaks, and numbers using Python syntax and spaCy.

    -

    4627534faec74c6cb30013b3b78abb84

    +

    a481a91a1d8c4b57885989804c065f7e

    The user can set if the text should be further summarized, and analyzed for sentiment and named entity recognition, by setting the keyword analyse_text to True (the default is False). If set, the transformers pipeline is used for each of these tasks, with the default models as of 03/2023. Other models can be selected by setting the optional keyword model_names to a list of selected models, on for each task: model_names=["sshleifer/distilbart-cnn-12-6", "distilbert-base-uncased-finetuned-sst-2-english", "dbmdz/bert-large-cased-finetuned-conll03-english"] for summary, sentiment, and ner. To be even more specific, revision numbers can also be selected by specifying the optional keyword revision_numbers to a list of revision numbers for each model, for example revision_numbers=["a4f8f3e", "af0f99b", "f2482bf"].

    Please note that for the Google Cloud Vision API (the TextDetector class) you need to set a key in order to process the images. This key is ideally set as an environment variable using for example

    @@ -615,7 +615,7 @@

    The detector modules

    Image summary and query

    The SummaryDetector can be used to generate image captions (summary) as well as visual question answering (VQA).

    -

    89ab67ce3b0e471e8741cfc2b23d97f1

    +

    faf82562ce8a4cd4babda34fde71e01e

    This module is based on the LAVIS library. Since the models can be quite large, an initial object is created which will load the necessary models into RAM/VRAM and then use them in the analysis. The user can specify the type of analysis to be performed using the analysis_type keyword. Setting it to summary will generate a caption (summary), questions will prepare answers (VQA) to a list of questions as set by the user, summary_and_questions will do both. Note that the desired analysis type needs to be set here in the initialization of the detector object, and not when running the analysis for each image; the same holds true for the selected model.

    The implemented models are listed below.

    @@ -878,7 +878,7 @@

    BLIP2 models

    Detection of faces and facial expression analysis

    Faces and facial expressions are detected and analyzed using the EmotionDetector class from the faces module. Initially, it is detected if faces are present on the image using RetinaFace, followed by analysis if face masks are worn (Face-Mask-Detection). The probabilistic detection of age, gender, race, and emotions is carried out with deepface, but only if the disclosure statement has been accepted (see above).

    -

    08b5f56998844e20961d743a8d32ea91

    +

    412f8c74483b4718849ff5047d5b90df

    Depending on the features found on the image, the face detection module returns a different analysis content: If no faces are found on the image, all further steps are skipped and the result "face": "No", "multiple_faces": "No", "no_faces": 0, "wears_mask": ["No"], "age": [None], "gender": [None], "race": [None], "emotion": [None], "emotion (category)": [None] is returned. If one or several faces are found, up to three faces are analyzed if they are partially concealed by a face mask. If yes, only age and gender are detected; if no, also race, emotion, and dominant emotion are detected. In case of the latter, the output could look like this: "face": "Yes", "multiple_faces": "Yes", "no_faces": 2, "wears_mask": ["No", "No"], "age": [27, 28], "gender": ["Man", "Man"], "race": ["asian", None], "emotion": ["angry", "neutral"], "emotion (category)": ["Negative", "Neutral"], where for the two faces that are detected (given by no_faces), some of the values are returned as a list with the first item for the first (largest) face and the second item for the second (smaller) face (for example, "emotion" returns a list ["angry", "neutral"] signifying the first face expressing anger, and the second face having a neutral expression).

    diff --git a/build/html/notebooks/Example cropposts.html b/build/html/notebooks/Example cropposts.html index 201e0dda..69935eb2 100644 --- a/build/html/notebooks/Example cropposts.html +++ b/build/html/notebooks/Example cropposts.html @@ -6,7 +6,7 @@ - Crop posts module — AMMICO 0.0.1 documentation + Crop posts module — AMMICO 0.2.2 documentation @@ -14,7 +14,7 @@ - + @@ -76,7 +76,7 @@
  • - Edit on GitHub + Edit on GitHub

  • diff --git a/build/html/py-modindex.html b/build/html/py-modindex.html index 6445c5d1..772f90c8 100644 --- a/build/html/py-modindex.html +++ b/build/html/py-modindex.html @@ -5,14 +5,14 @@ - Python Module Index — AMMICO 0.0.1 documentation + Python Module Index — AMMICO 0.2.2 documentation - + diff --git a/build/html/readme_link.html b/build/html/readme_link.html index e462c0ed..b449d1b2 100644 --- a/build/html/readme_link.html +++ b/build/html/readme_link.html @@ -6,14 +6,14 @@ - AMMICO - AI Media and Misinformation Content Analysis Tool — AMMICO 0.0.1 documentation + AMMICO - AI Media and Misinformation Content Analysis Tool — AMMICO 0.2.2 documentation - + @@ -85,7 +85,7 @@
  • - Edit on GitHub + Edit on GitHub

  • @@ -147,25 +147,25 @@

    Installation
    pip install ammico
     
    -

    This will install the package and its dependencies locally. If after installation you get some errors when running some modules, please follow the instructions in the FAQ.

    +

    This will install the package and its dependencies locally. If after installation you get some errors when running some modules, please follow the instructions in the FAQ.

    Usage

    -

    The main demonstration notebook can be found in the notebooks folder and also on google colab: [Open In Colab].

    +

    The main demonstration notebook can be found in the notebooks folder and also on google colab: Open In Colab.

    There are further sample notebooks in the notebooks folder for the more experimental features:

    1. Topic analysis: Use the notebook get-text-from-image.ipynb to analyse the topics of the extraced text.
      -You can run this notebook on google colab: [Open In Colab
      +You can run this notebook on google colab: Open In Colab
      Place the data files and google cloud vision API key in your google drive to access the data.

    2. To crop social media posts use the cropposts.ipynb notebook. -You can run this notebook on google colab: [Open In Colab

    3. +You can run this notebook on google colab: Open In Colab

    Features

    Text extraction

    -

    The text is extracted from the images using google-cloud-vision. For this, you need an API key. Set up your google account following the instructions on the google Vision AI website or as described here. +

    The text is extracted from the images using google-cloud-vision. For this, you need an API key. Set up your google account following the instructions on the google Vision AI website or as described here. You then need to export the location of the API key as an environment variable:

    export GOOGLE_APPLICATION_CREDENTIALS="location of your .json"
     
    diff --git a/build/html/search.html b/build/html/search.html index 8ff80553..c8a516a4 100644 --- a/build/html/search.html +++ b/build/html/search.html @@ -5,7 +5,7 @@ - Search — AMMICO 0.0.1 documentation + Search — AMMICO 0.2.2 documentation @@ -13,7 +13,7 @@ - + diff --git a/build/html/set_up_credentials.html b/build/html/set_up_credentials.html index 2a9b6a39..7a546c9f 100644 --- a/build/html/set_up_credentials.html +++ b/build/html/set_up_credentials.html @@ -6,14 +6,14 @@ - Instructions how to generate and enable a google Cloud Vision API key — AMMICO 0.0.1 documentation + Instructions how to generate and enable a google Cloud Vision API key — AMMICO 0.2.2 documentation - + @@ -71,7 +71,7 @@
  • - Edit on GitHub + Edit on GitHub

  • diff --git a/source/conf.py b/source/conf.py index 047d47bb..c8d1d6bd 100644 --- a/source/conf.py +++ b/source/conf.py @@ -15,7 +15,7 @@ project = "AMMICO" copyright = "2022, Scientific Software Center, Heidelberg University" author = "Scientific Software Center, Heidelberg University" -release = "0.0.1" +release = "0.2.2" # -- General configuration --------------------------------------------------- # https://www.sphinx-doc.org/en/master/usage/configuration.html#general-configuration @@ -31,7 +31,7 @@ "github_user": "ssciwr", # Username "github_repo": "AMMICO", # Repo name "github_version": "main", # Version - "conf_py_path": "/source/", # Path in the checkout to the docs root + "conf_py_path": "/docs/source/", # Path in the checkout to the docs root } templates_path = ["_templates"]