RTE Build committed on
Commit
a099612
·
0 Parent(s):

Deployment

Browse files
Files changed (44) hide show
  1. .gitattributes +37 -0
  2. .gitignore +179 -0
  3. .gitlint +143 -0
  4. .pre-commit-config.yaml +51 -0
  5. DEVELOPMENT.md +179 -0
  6. README.md +41 -0
  7. data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_20_0.png +3 -0
  8. data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_3_0.png +3 -0
  9. data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_7_0.png +3 -0
  10. data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_7_1.png +3 -0
  11. data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_7_2.png +3 -0
  12. data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_8_0.png +3 -0
  13. data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_8_1.png +3 -0
  14. data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_8_2.png +3 -0
  15. data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_8_3.png +3 -0
  16. data/final_v2_mar04/images/wihlborgs/images/image_16_0.png +3 -0
  17. data/final_v2_mar04/images/wihlborgs/images/image_16_1.png +3 -0
  18. data/final_v2_mar04/images/wihlborgs/images/image_16_2.png +3 -0
  19. data/final_v2_mar04/images/wihlborgs/images/image_16_3.png +3 -0
  20. data/final_v2_mar04/images/wihlborgs/images/image_17_0.png +3 -0
  21. data/final_v2_mar04/images/wihlborgs/images/image_17_1.png +3 -0
  22. data/final_v2_mar04/images/wihlborgs/images/image_17_2.png +3 -0
  23. data/final_v2_mar04/milvus/.milvus.db.lock +0 -0
  24. data/final_v2_mar04/milvus/milvus.db +3 -0
  25. data/final_v2_mar04/pdfs/IBM_Annual_Report_2007_3-20.pdf +3 -0
  26. data/final_v2_mar04/pdfs/wihlborgs-2-13_16-18.pdf +3 -0
  27. data/final_v2_mar04/preview/IBM-Z.png +3 -0
  28. data/final_v2_mar04/preview/IBM-financial-2010.png +3 -0
  29. data/final_v2_mar04/preview/Wilhlborg-financial.png +3 -0
  30. poetry.lock +0 -0
  31. pyproject.toml +62 -0
  32. requirements.txt +101 -0
  33. src/README.md +14 -0
  34. src/app.css +39 -0
  35. src/app_head.html +12 -0
  36. src/qa_app.py +331 -0
  37. src/rag_app.py +275 -0
  38. src/sandbox/light_rag/credits.txt +4 -0
  39. src/sandbox/light_rag/hf_embedding.py +38 -0
  40. src/sandbox/light_rag/hf_llm.py +24 -0
  41. src/sandbox/light_rag/light_rag.py +168 -0
  42. src/sandbox/light_rag/utils.py +46 -0
  43. src/themes/carbon.py +147 -0
  44. src/themes/research_monochrome.py +152 -0
.gitattributes ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ data/**/* filter=lfs diff=lfs merge=lfs -text
37
+ *.png filter=lfs diff=lfs merge=lfs -text
.gitignore ADDED
@@ -0,0 +1,179 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Byte-compiled / optimized / DLL files
2
+ __pycache__/
3
+ *.py[cod]
4
+ *$py.class
5
+
6
+ # C extensions
7
+ *.so
8
+
9
+ # Distribution / packaging
10
+ .Python
11
+ build/
12
+ develop-eggs/
13
+ dist/
14
+ downloads/
15
+ eggs/
16
+ .eggs/
17
+ lib/
18
+ lib64/
19
+ parts/
20
+ sdist/
21
+ var/
22
+ wheels/
23
+ share/python-wheels/
24
+ *.egg-info/
25
+ .installed.cfg
26
+ *.egg
27
+ MANIFEST
28
+
29
+ # PyInstaller
30
+ # Usually these files are written by a python script from a template
31
+ # before PyInstaller builds the exe, so as to inject date/other infos into it.
32
+ *.manifest
33
+ *.spec
34
+
35
+ # Installer logs
36
+ pip-log.txt
37
+ pip-delete-this-directory.txt
38
+
39
+ # Unit test / coverage reports
40
+ htmlcov/
41
+ .tox/
42
+ .nox/
43
+ .coverage
44
+ .coverage.*
45
+ .cache
46
+ nosetests.xml
47
+ coverage.xml
48
+ *.cover
49
+ *.py,cover
50
+ .hypothesis/
51
+ .pytest_cache/
52
+ cover/
53
+
54
+ # Translations
55
+ *.mo
56
+ *.pot
57
+
58
+ # Django stuff:
59
+ *.log
60
+ local_settings.py
61
+ db.sqlite3
62
+ db.sqlite3-journal
63
+
64
+ # Flask stuff:
65
+ instance/
66
+ .webassets-cache
67
+
68
+ # Scrapy stuff:
69
+ .scrapy
70
+
71
+ # Sphinx documentation
72
+ docs/_build/
73
+
74
+ # PyBuilder
75
+ .pybuilder/
76
+ target/
77
+
78
+ # Jupyter Notebook
79
+ .ipynb_checkpoints
80
+
81
+ # IPython
82
+ profile_default/
83
+ ipython_config.py
84
+
85
+ # pyenv
86
+ # For a library or package, you might want to ignore these files since the code is
87
+ # intended to run in multiple environments; otherwise, check them in:
88
+ # .python-version
89
+
90
+ # pipenv
91
+ # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
92
+ # However, in case of collaboration, if having platform-specific dependencies or dependencies
93
+ # having no cross-platform support, pipenv may install dependencies that don't work, or not
94
+ # install all needed dependencies.
95
+ #Pipfile.lock
96
+
97
+ # UV
98
+ # Similar to Pipfile.lock, it is generally recommended to include uv.lock in version control.
99
+ # This is especially recommended for binary packages to ensure reproducibility, and is more
100
+ # commonly ignored for libraries.
101
+ #uv.lock
102
+
103
+ # poetry
104
+ # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
105
+ # This is especially recommended for binary packages to ensure reproducibility, and is more
106
+ # commonly ignored for libraries.
107
+ # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
108
+ #poetry.lock
109
+
110
+ # pdm
111
+ # Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
112
+ #pdm.lock
113
+ # pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
114
+ # in version control.
115
+ # https://pdm.fming.dev/latest/usage/project/#working-with-version-control
116
+ .pdm.toml
117
+ .pdm-python
118
+ .pdm-build/
119
+
120
+ # PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
121
+ __pypackages__/
122
+
123
+ # Celery stuff
124
+ celerybeat-schedule
125
+ celerybeat.pid
126
+
127
+ # SageMath parsed files
128
+ *.sage.py
129
+
130
+ # Environments
131
+ .env
132
+ .venv
133
+ env/
134
+ venv/
135
+ ENV/
136
+ env.bak/
137
+ venv.bak/
138
+
139
+ # Spyder project settings
140
+ .spyderproject
141
+ .spyproject
142
+
143
+ # Rope project settings
144
+ .ropeproject
145
+
146
+ # mkdocs documentation
147
+ /site
148
+
149
+ # mypy
150
+ .mypy_cache/
151
+ .dmypy.json
152
+ dmypy.json
153
+
154
+ # Pyre type checker
155
+ .pyre/
156
+
157
+ # pytype static type analyzer
158
+ .pytype/
159
+
160
+ # Cython debug symbols
161
+ cython_debug/
162
+
163
+ # PyCharm
164
+ # JetBrains specific template is maintained in a separate JetBrains.gitignore that can
165
+ # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
166
+ # and can be added to the global gitignore or merged into this file. For a more nuclear
167
+ # option (not recommended) you can uncomment the following to ignore the entire idea folder.
168
+ #.idea/
169
+
170
+
171
+ # Boilerplate specific ignores
172
+ .gradio/
173
+ .ruff_cache/
174
+
175
+
176
+ ## own ignores
177
+ /src/app_text.py
178
+ /.idea/
179
+ /nbs/
.gitlint ADDED
@@ -0,0 +1,143 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Edit this file as you like.
2
+ #
3
+ # All these sections are optional. Each section with the exception of [general] represents
4
+ # one rule and each key in it is an option for that specific rule.
5
+ #
6
+ # Rules and sections can be referenced by their full name or by id. For example
7
+ # section "[body-max-line-length]" could also be written as "[B1]". Full section names are
8
+ # used in here for clarity.
9
+ #
10
+ # [general]
11
+ # Ignore certain rules, this example uses both full name and id
12
+ # ignore=title-trailing-punctuation, T3
13
+
14
+ [general]
15
+ # You HAVE to add the rule here to enable it, only configuring (such as below)
16
+ # does NOT enable it.
17
+ contrib=contrib-title-conventional-commits
18
+
19
+ [contrib-title-conventional-commits]
20
+ # Specify allowed commit types. For details see: https://www.conventionalcommits.org/
21
+ types = build,chore,ci,docs,feat,fix,perf,refactor,revert,style,test
22
+
23
+ # verbosity should be a value between 1 and 3, the commandline -v flags take precedence over this
24
+ # verbosity = 2
25
+
26
+ # By default gitlint will ignore merge, revert, fixup and squash commits.
27
+ # ignore-merge-commits=true
28
+ # ignore-revert-commits=true
29
+ # ignore-fixup-commits=true
30
+ # ignore-squash-commits=true
31
+
32
+ # Ignore any data sent to gitlint via stdin
33
+ # ignore-stdin=true
34
+
35
+ # Fetch additional meta-data from the local repository when manually passing a
36
+ # commit message to gitlint via stdin or --commit-msg. Disabled by default.
37
+ # staged=true
38
+
39
+ # Hard fail when the target commit range is empty. Note that gitlint will
40
+ # already fail by default on invalid commit ranges. This option is specifically
41
+ # to tell gitlint to fail on *valid but empty* commit ranges.
42
+ # Disabled by default.
43
+ # fail-without-commits=true
44
+
45
+ # Enable debug mode (prints more output). Disabled by default.
46
+ # debug=true
47
+
48
+ # Enable community contributed rules
49
+ # See http://jorisroovers.github.io/gitlint/contrib_rules for details
50
+ # contrib=contrib-title-conventional-commits,CC1
51
+
52
+ # Set the extra-path where gitlint will search for user defined rules
53
+ # See http://jorisroovers.github.io/gitlint/user_defined_rules for details
54
+ # extra-path=examples/
55
+
56
+ # This is an example of how to configure the "title-max-length" rule and
57
+ # set the line-length it enforces to 50
58
+ # [title-max-length]
59
+ # line-length=50
60
+
61
+ # Conversely, you can also enforce minimal length of a title with the
62
+ # "title-min-length" rule:
63
+ # [title-min-length]
64
+ # min-length=5
65
+
66
+ # [title-must-not-contain-word]
67
+ # Comma-separated list of words that should not occur in the title. Matching is case
68
+ # insensitive. It's fine if the keyword occurs as part of a larger word (so "WIPING"
69
+ # will not cause a violation, but "WIP: my title" will.
70
+ # words=wip
71
+
72
+ # [title-match-regex]
73
+ # python-style regex that the commit-msg title must match
74
+ # Note that the regex can contradict with other rules if not used correctly
75
+ # (e.g. title-must-not-contain-word).
76
+ # regex=^US[0-9]*
77
+
78
+ # [body-max-line-length]
79
+ # line-length=72
80
+
81
+ # [body-min-length]
82
+ # min-length=5
83
+
84
+ # [body-is-missing]
85
+ # Whether to ignore this rule on merge commits (which typically only have a title)
86
+ # default = True
87
+ # ignore-merge-commits=false
88
+
89
+ # [body-changed-file-mention]
90
+ # List of files that need to be explicitly mentioned in the body when they are changed
91
+ # This is useful for when developers often erroneously edit certain files or git submodules.
92
+ # By specifying this rule, developers can only change the file when they explicitly reference
93
+ # it in the commit message.
94
+ # files=gitlint-core/gitlint/rules.py,README.md
95
+
96
+ # [body-match-regex]
97
+ # python-style regex that the commit-msg body must match.
98
+ # E.g. body must end in My-Commit-Tag: foo
99
+ # regex=My-Commit-Tag: foo$
100
+
101
+ # [author-valid-email]
102
+ # python-style regex that the commit author email address must match.
103
+ # For example, use the following regex if you only want to allow email addresses from foo.com
104
+ # regex=[^@]+@foo.com
105
+
106
+ # [ignore-by-title]
107
+ # Ignore certain rules for commits of which the title matches a regex
108
+ # E.g. Match commit titles that start with "Release"
109
+ # regex=^Release(.*)
110
+
111
+ # Ignore certain rules, you can reference them by their id or by their full name
112
+ # Use 'all' to ignore all rules
113
+ # ignore=T1,body-min-length
114
+
115
+ # [ignore-by-body]
116
+ # Ignore certain rules for commits of which the body has a line that matches a regex
117
+ # E.g. Match bodies that have a line that contains "release"
118
+ # regex=(.*)release(.*)
119
+ #
120
+ # Ignore certain rules, you can reference them by their id or by their full name
121
+ # Use 'all' to ignore all rules
122
+ # ignore=T1,body-min-length
123
+
124
+ # [ignore-body-lines]
125
+ # Ignore certain lines in a commit body that match a regex.
126
+ # E.g. Ignore all lines that start with 'Co-Authored-By'
127
+ # regex=^Co-Authored-By
128
+
129
+ # [ignore-by-author-name]
130
+ # Ignore certain rules for commits of which the author name matches a regex
131
+ # E.g. Match commits made by dependabot
132
+ # regex=(.*)dependabot(.*)
133
+ #
134
+ # Ignore certain rules, you can reference them by their id or by their full name
135
+ # Use 'all' to ignore all rules
136
+ # ignore=T1,body-min-length
137
+
138
+ # This is a contrib rule - a community contributed rule. These are disabled by default.
139
+ # You need to explicitly enable them one-by-one by adding them to the "contrib" option
140
+ # under [general] section above.
141
+ # [contrib-title-conventional-commits]
142
+ # Specify allowed commit types. For details see: https://www.conventionalcommits.org/
143
+ # types = bugfix,user-story,epic
.pre-commit-config.yaml ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ repos:
2
+ - repo: https://github.com/pre-commit/pre-commit-hooks
3
+ rev: v5.0.0
4
+ hooks:
5
+ - id: check-added-large-files
6
+ - id: check-ast
7
+ - id: check-case-conflict
8
+ - id: check-json
9
+ - id: check-merge-conflict
10
+ - id: check-toml
11
+ - id: end-of-file-fixer
12
+ - repo: https://github.com/astral-sh/ruff-pre-commit
13
+ # Ruff version.
14
+ rev: v0.8.6
15
+ hooks:
16
+ - id: ruff
17
+ - repo: https://github.com/pycqa/isort
18
+ rev: 5.13.2
19
+ hooks:
20
+ - id: isort
21
+ args: ["--profile", "black"]
22
+ - repo: https://github.com/asottile/pyupgrade
23
+ rev: v3.19.1
24
+ hooks:
25
+ - id: pyupgrade
26
+ args: ["--py310-plus"]
27
+ - repo: https://github.com/psf/black
28
+ rev: 24.10.0
29
+ hooks:
30
+ - id: black
31
+ args:
32
+ - --line-length=120
33
+ - repo: https://github.com/jorisroovers/gitlint
34
+ rev: v0.19.1
35
+ hooks:
36
+ - id: gitlint
37
+ name: gitlint
38
+ language: python
39
+ entry: gitlint
40
+ args: [--staged, --msg-filename]
41
+ stages: [commit-msg]
42
+ - repo: https://github.com/python-poetry/poetry
43
+ rev: '1.8.0'
44
+ hooks:
45
+ - id: poetry-check
46
+ - id: poetry-lock
47
+ args: [--no-update]
48
+ language_version: "3.10"
49
+ - id: poetry-export
50
+ name: poetry export for base requirements
51
+ args: [-f, requirements.txt, -o, requirements.txt, -n, --only=main, --without-hashes]
DEVELOPMENT.md ADDED
@@ -0,0 +1,179 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # IBM Research Hugging Face Spaces gradio template
2
+
3
+ This template repository lets you quickly build a [gradio](https://www.gradio.app/) Hugging Face spaces demo for the [ibm-granite org](https://huggingface.co/ibm-granite). It is set up with the requirements, theming and analytics for the ibm-granite org as well as pre-commit hooks and linting configuration to maintain a consistent code standard across all demos.
4
+
5
+ ## 👩‍💻 Introduction
6
+
7
+ To deploy demos to the ibm-granite org on Hugging Face, you will be working with the Research Design Technical Experiences (RDTE) team via this GitHub org. You will not gain access to the ibm-granite Hugging Face org as there are limited seats available. Hence, you will work via the RDTE team (who have write access) to create and deploy demos to Hugging Face.
8
+
9
+ ## 🛠️ Getting started
10
+
11
+ This is the place to start when building gradio demos for IBM Granite. Complete the following steps to get a repository set up and configured for your demo as well as the deployment pipeline to validate and push it to Hugging Face spaces.
12
+
13
+ 1. [Raise an onboarding request](https://github.ibm.com/ibm-huggingface-space-demos/deployment/issues/new?assignees=james-sutton,gwhite&labels=onboarding%2Ctriage&projects=&template=onboarding.yaml&title=%5BOnboarding%5D%3A+). Please fill the templated onboarding request to get a new repository set up for you in this org and to give access to anything else required.
14
+ 2. Once your repository has been created, please either update it with your existing demo if you have one, or have a play with the example and modify it to create your new demo. You'll be working in the `main` branch whilst developing your demo. Your `main` branch is linked to the "QA" instance of your demo in the IBM org on Hugging Face.
15
+ 3. Make sure that you follow this development guide and use the pre-configured pre-commit hooks before every commit and push.
16
+ 4. Once you are happy with your demo and want to get it deployed into production on Hugging Face spaces in the ibm-granite org, open a pull request to merge the `main` branch into the `stable` branch. The RDTE team will validate the demo works well both from a technical and UX standpoint. If your demo needs any custom environment variables or secrets, let the RDTE team know and we will contact you directly to get them added to the Space configuration on Hugging Face.
17
+ 5. Once the Pull request has been approved, you can merge it into the `stable` branch. A deployment will then push your changes to Hugging Face spaces where it will build and become available for use. Initially, both the "QA" and "Production" versions of your demo will be marked as private and only visible to members of the ibm-research org (QA) and ibm-granite org (production) that have logged into Hugging Face. The "QA" version will always remain private in the ibm-research org. However, when the RDTE team are happy to publish the demo to stable, they will mark the "Production" version as public in the ibm-granite org.
18
+
19
+ ### Onboarding Process Summary
20
+
21
+ The following diagram explains the onboarding process. Actions that you, the developer, take are shown in darker blue. Actions that we, the RDTE team, take are shown in lighter blue. The lighter blue steps that have darker borders are automations maintained by the RDTE team, these steps require no manual intervention.
22
+
23
+ ```mermaid
24
+ flowchart TD
25
+ 1[Developer opens onboarding ticket in GHE Org]:::developer-->2
26
+ 2{RDTE team review the request}:::rdte--Request returned with comments-->1
27
+ 2--Approved-->3
28
+ 3[Developer is invited to join the ibm-research org on HF]:::rdte-->4
29
+ 4[New git repository created from template and configured]:::rdte-->5
30
+ 5[QA HF space created in IBM org]:::rdte-->6
31
+ 6[Developers push commits to main branch]:::developer-->7
32
+ 7-->6
33
+ 7[Main branch deployed to QA space in ibm-granite org on HF]:::rdteauto-->8
34
+ 8[Developers open/update PR to merge main branch to stable branch]:::developer-->9
35
+ 9{PR review}:::rdte--PR Approved-->10
36
+ 9--Changes requested-->6
37
+ 10{Prod space exists?}:::rdte-- Yes -->12
38
+ 10-- No -->11
39
+ 11[Prod HF space created in ibm-granite org]:::rdte-->12
40
+ 12[Merge PR]:::developer-->13
41
+ 13[Stable branch deployed to prod space in ibm-granite org on HF]:::rdteauto
42
+ classDef rdte fill:#EDF5FF,stroke:#D0E2FF,color:#000;
43
+ classDef rdteauto fill:#EDF5FF,stroke:#78A9FF,color:#000;
44
+ classDef developer fill:#A6C8FF,stroke:#78A9FF,color:#000;
45
+ ```
46
+
47
+ ## 🛠️ Development guide
48
+
49
+ Further information on developing the code in this repository is provided below.
50
+
51
+ ### Clone your code repository
52
+
53
+ Once you have been notified that your code repository has been created in this org, you can clone it to your local machine and start work.
54
+
55
+ If you just want to play with our template, you're welcome to [use it](https://github.ibm.com/new?template_name=gradio-template&template_owner=ibm-huggingface-space-demos) to create a new code repository in another org. Later, for deployment, you will need to move your code to the repository created in this org.
56
+
57
+ ### Prerequisites
58
+
59
+ Some things you will need to do on your machine before developing.
60
+
61
+ #### Precommit
62
+
63
+ [Precommit](https://pre-commit.com) is a tool that adds git commit hooks. You will need to [install](https://pre-commit.com/#install) it on your machine and then run within your code repository:
64
+
65
+ ```shell
66
+ pre-commit install
67
+ ```
68
+
69
+ You can manually run pre-commit using the following command:
70
+
71
+ ```shell
72
+ # To run against staged files:
73
+ pre-commit run
74
+
75
+ # If you want to run against staged and unstaged files:
76
+ pre-commit run --all-files
77
+ ```
78
+
79
+ It is important to run the pre-commit hooks and fix any files that fail before you commit and push to the repository as the pull request build will fail any PR that does not adhere to them i.e. the RDTE team will only accept your code for deployment to Hugging Face once it has passed all of the pre-commit checks.
80
+
81
+ #### Poetry
82
+
83
+ [Poetry](https://python-poetry.org/) is a tool for Python packaging, dependency and virtual environment management that is used to manage the development of this project. You will need to install Poetry locally. There are several ways to install it including through the package manager of your operating system, however, the easiest way to install is likely using their installer, as follows:
84
+
85
+ ```shell
86
+ curl -sSL https://install.python-poetry.org | python3 -
87
+ ```
88
+
89
+ You can also use `pip` and `pipx` to install poetry, the details of which are at https://python-poetry.org/docs/
90
+
91
+ Once installed, the project is configured and controlled via the `pyproject.toml` file with the current dependency tree stored in `poetry.lock`. You may also [configure poetry](https://python-poetry.org/docs/configuration/) further if you wish but there is no need to do so as the default options are sufficient. You may, however, wish to change some of the options set in this template:
92
+
93
+ | Setting | Notes |
94
+ | ------- | ----- |
95
+ | name | **Update this**, to reflect the name of your demo |
96
+ | version | **Update this**, to reflect the current version of your demo |
97
+ | description | **Update this**, to a short description of your demo |
98
+ | authors | **Update this**, to the list of authors of your demo |
99
+
100
+ ## 🛠️ Install and run locally
101
+
102
+ To get set up ready to run the code in development mode:
103
+
104
+ ```shell
105
+ # add the poetry shell and export plugins (you only need to do this once on your machine)
106
+ poetry self add poetry-plugin-shell
107
+ poetry self add poetry-plugin-export
108
+
109
+ # create and activate a python virtual environment
110
+ poetry shell
111
+ poetry install
112
+
113
+ # run the demo locally (for development with automatic reload)
114
+ gradio src/app.py
115
+ ```
116
+
117
+ ## 📝 Documenting your demo
118
+
119
+ If you would like to write some information/documentation about your demo that is intended for developers or other people that might want to run the demo from scratch, please use the [README.md](README.md) file, leaving the Hugging Face Spaces configuration header in place at the top of the file.
120
+
121
+ ### Hugging face spaces configuration settings
122
+
123
+ Hugging Face allow the configuration of spaces demonstrations via the [README.md](README.md) file in the root of the project. There is a [Spaces Configuration Reference](https://huggingface.co/docs/hub/en/spaces-config-reference) guide that you can use to gain an understanding of the configuration options that can be specified here.
124
+
125
+ The template has a set of initial defaults, similar to these:
126
+
127
+ ```
128
+ ---
129
+ title: Granite 3.0 Chat
130
+ colorFrom: blue
131
+ colorTo: indigo
132
+ sdk: gradio
133
+ sdk_version: 5.9.1
134
+ app_file: src/app.py
135
+ pinned: false
136
+ license: apache-2.0
137
+ short_description: Chat with IBM Granite 3.0
138
+ ---
139
+ ```
140
+
141
+ #### Options
142
+
143
+ The default options specified above:
144
+
145
+ | Setting | Notes |
146
+ | ------- | ----- |
147
+ | title | **Update this**, keep this short (recommend max 24 chars), this information is displayed in the centre of the demo description card |
148
+ | emoji | Do not update this, our demos will use a consistent emoji character |
149
+ | colorFrom | Do not update this, used in combination with colorTo to colourize the demo description card |
150
+ | colorTo | see colorFrom |
151
+ | sdk | Do not update this, our Gradio demos will always use the "gradio" setting |
152
+ | sdk_version | Update this if necessary for your demo to function, ideally should be set to the latest gradio version |
153
+ | app_file | Update this if necessary for your demo to function, should be set to the path of the main entry point to the demo |
154
+ | license | Do not update this, our demos are to always be apache-2.0 licensed |
155
+ | short_description | **Update this**, should be set to a few words that describe the demo in a little more detail than the title, this information is displayed in the bottom-right of the demo description card |
156
+
157
+ Other available options:
158
+
159
+ | Setting | Notes |
160
+ | ------- | ----- |
161
+ | python_version | You may optionally set this, best advice is to use the default Python version if possible (current default is Python 3.10) |
162
+ | suggested_hardware | Do not use this, unlikely to be required as demos run on ZeroGPU |
163
+ | suggested_storage | Do not use this, our demos do not require storage |
164
+ | app_port | Do not use this, not relevant for gradio demos |
165
+ | base_path | Do not use this, use the app_file setting |
166
+ | fullWidth | Do not use this, our demos will use a consistent default width |
167
+ | header | Do not use this, our demos will use a consistent header |
168
+ | models | Do not use this, let their parsing discover these from our code |
169
+ | datasets | Do not use this, let their parsing discover these from our code |
170
+ | tags | Do not use this, we are not tagging our demos |
171
+ | thumbnail | Do not use this, provides a thumbnail for social sharing of demos |
172
+ | pinned | Do not use this, the RDTE team will change this setting if it's deemed necessary |
173
+ | hf_oauth | Do not use this, we are not using OAuth |
174
+ | hf_oauth_scopes | Do not use this, we are not using OAuth |
175
+ | hf_oauth_expiration_minutes | Do not use this, we are not using OAuth |
176
+ | disable_embedding | Do not use this, leave at the default that allows embedding to take place |
177
+ | startup_duration_timeout | Do not use this, leave at the default 30 minutes |
178
+ | custom_headers | Do not use this, we do not need to add any custom HTTP headers |
179
+ | preload_from_hub | Do not use this, specifying this builds the models and data sets into the container image with the goal of making start up times faster due to not needing to download them each time. However, RDTE testing indicates this setting significantly increases the start up time for our relatively small Granite models |
README.md ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: Multimodal RAG with Granite Vision
3
+ short_description: RAG example using Granite [vision, embedding, instruct]
4
+ colorFrom: blue
5
+ colorTo: indigo
6
+ sdk: gradio
7
+ sdk_version: 5.16.1
8
+ app_file: src/rag_app.py
9
+ pinned: False
10
+ license: apache-2.0
11
+ ---
12
+
13
+ # Granite Vision Demos
14
+
15
+ ## Install
16
+
17
+ (copied from DEVELOPMENT.md)
18
+ ```shell
19
+ # add the poetry shell and export plugins (you only need to do this once on your machine)
20
+ poetry self add poetry-plugin-shell
21
+ poetry self add poetry-plugin-export
22
+
23
+ # create and activate a python virtual environment
24
+ poetry shell
25
+ poetry install
26
+ ```
27
+
28
+
29
+ ## Run Demos
30
+
31
+ ### RAG
32
+ Run with lazy loading models:
33
+ ```
34
+ LAZY_LOADING=true gradio src/rag_app.py
35
+ ```
36
+
37
+ ### QA
38
+
39
+ ```
40
+ gradio src/qa_app.py
41
+ ```
data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_20_0.png ADDED

Git LFS Details

  • SHA256: 985dee55a5b0af267bb85889552e5b7ec5d8d5da804ee41b634a14dfe4bf0efb
  • Pointer size: 131 Bytes
  • Size of remote file: 855 kB
data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_3_0.png ADDED

Git LFS Details

  • SHA256: e92f65236228cae69616b6061154aa9f2098f29d91e0fb3359e5069f435a5703
  • Pointer size: 131 Bytes
  • Size of remote file: 535 kB
data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_7_0.png ADDED

Git LFS Details

  • SHA256: 8d027f1913bf06566e6bd9410fa3b03036867d01c73f88862839cf517eaa3894
  • Pointer size: 131 Bytes
  • Size of remote file: 254 kB
data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_7_1.png ADDED

Git LFS Details

  • SHA256: a13bb521e7f181b83c85b2cbb38847ea61ee69d3392d8591a639e75563855381
  • Pointer size: 131 Bytes
  • Size of remote file: 229 kB
data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_7_2.png ADDED

Git LFS Details

  • SHA256: 7a7cd973417093075c7066c5865d6cbb02e590cd6a654f63518867a465aeaab0
  • Pointer size: 132 Bytes
  • Size of remote file: 1.03 MB
data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_8_0.png ADDED

Git LFS Details

  • SHA256: 2f77e5fc5d1071173df145f2b6dcdee85d45d7e19d4e3a207cbc516c3a3691a0
  • Pointer size: 131 Bytes
  • Size of remote file: 270 kB
data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_8_1.png ADDED

Git LFS Details

  • SHA256: 253e65a514d72156bb90ce8b7fe40df3b88d5389921cf9434b0ee6094493d74d
  • Pointer size: 131 Bytes
  • Size of remote file: 169 kB
data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_8_2.png ADDED

Git LFS Details

  • SHA256: 49180360e894006245806bd504adef342f308e4b513e8b78d0849b10e8c1c0fb
  • Pointer size: 131 Bytes
  • Size of remote file: 312 kB
data/final_v2_mar04/images/ibm_report_2007/images/IBM_Annual_Report_2007_0-20_im_image_8_3.png ADDED

Git LFS Details

  • SHA256: ab33e6c5c6761eb4519a341facc8c40086d85803c09757bc10cc2aea71c8401e
  • Pointer size: 131 Bytes
  • Size of remote file: 213 kB
data/final_v2_mar04/images/wihlborgs/images/image_16_0.png ADDED

Git LFS Details

  • SHA256: cb9ba6222cc9c098a9a213c355c0f4b3a6f33f2b529de2b2f88fd5c1b72fffaf
  • Pointer size: 130 Bytes
  • Size of remote file: 33 kB
data/final_v2_mar04/images/wihlborgs/images/image_16_1.png ADDED

Git LFS Details

  • SHA256: 1623a516ba7abddc922c623baa5724e1528508d3ce11f552e3d2149e70258968
  • Pointer size: 130 Bytes
  • Size of remote file: 35.2 kB
data/final_v2_mar04/images/wihlborgs/images/image_16_2.png ADDED

Git LFS Details

  • SHA256: 27972cafcb60943edcd323a833f1d364ec2fba6c9f90fe0f4908fc60dba80709
  • Pointer size: 130 Bytes
  • Size of remote file: 40.3 kB
data/final_v2_mar04/images/wihlborgs/images/image_16_3.png ADDED

Git LFS Details

  • SHA256: 851717f397031eda475c4686e358cd5d03317ef2b5b6577f83027a0746626c55
  • Pointer size: 130 Bytes
  • Size of remote file: 36 kB
data/final_v2_mar04/images/wihlborgs/images/image_17_0.png ADDED

Git LFS Details

  • SHA256: 63e41e42b36c0762fe87bb664f18337549b28f9da81b3578a450933d97632544
  • Pointer size: 130 Bytes
  • Size of remote file: 29.7 kB
data/final_v2_mar04/images/wihlborgs/images/image_17_1.png ADDED

Git LFS Details

  • SHA256: e2c8a9eb0b2a88b48884dfe5dc50d1f65c8b288a6cf39138cfddaff7cc4acbcb
  • Pointer size: 130 Bytes
  • Size of remote file: 28.5 kB
data/final_v2_mar04/images/wihlborgs/images/image_17_2.png ADDED

Git LFS Details

  • SHA256: 413fac047292786046e1eaf9ce713c786f98c9215aeff8ccabb3a1761628873e
  • Pointer size: 130 Bytes
  • Size of remote file: 34.6 kB
data/final_v2_mar04/milvus/.milvus.db.lock ADDED
File without changes
data/final_v2_mar04/milvus/milvus.db ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e08ba08b5adbee90a02d7e02961d4b9f124cc5cc0281eaa93e594f3f033391f9
3
+ size 475136
data/final_v2_mar04/pdfs/IBM_Annual_Report_2007_3-20.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:496db869d12b0a31f00c872c1d9f6840500a6677221c51a362e9b1943062e7f9
3
+ size 988484
data/final_v2_mar04/pdfs/wihlborgs-2-13_16-18.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:487233ff87278df209c8bb4400048f43ba85ab10ccabd75905c362e55b797ddf
3
+ size 800249
data/final_v2_mar04/preview/IBM-Z.png ADDED

Git LFS Details

  • SHA256: 1ab646a5521525ff45865262fb83b4715c535b2d0545f384768af487853ff1a7
  • Pointer size: 131 Bytes
  • Size of remote file: 740 kB
data/final_v2_mar04/preview/IBM-financial-2010.png ADDED

Git LFS Details

  • SHA256: bab2d4c12a1cb8535748cd06a474ebb2a1fc74cece7da25a26ea24ef71dc0791
  • Pointer size: 131 Bytes
  • Size of remote file: 273 kB
data/final_v2_mar04/preview/Wilhlborg-financial.png ADDED

Git LFS Details

  • SHA256: 1b869ff930815b09809501853c0c0428da693fb69790a30cccacff09e9e257e9
  • Pointer size: 131 Bytes
  • Size of remote file: 448 kB
poetry.lock ADDED
The diff for this file is too large to render. See raw diff
 
pyproject.toml ADDED
@@ -0,0 +1,62 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [tool.poetry]
2
+ name = "granite-vision-demos"
3
+ version = "0.1.0"
4
+ description = "A collection of gradio demos for granite vision models."
5
+ authors = ["Hendrik Strobelt <hendrik.strobelt@ibm.com>"]
6
+ license = "Apache-2.0"
7
+ readme = "README.md"
8
+ package-mode = false
9
+
10
+ [tool.poetry.dependencies]
11
+ python = ">=3.10,<3.11"
12
+ gradio = "5.16.1"
13
+ torch = "2.4.0"
14
+ spaces = "0.30.4"
15
+ transformers = { git = "https://github.com/huggingface/transformers" }
16
+ accelerate = "^1.2.1"
17
+ langchain-milvus = "^0.1.8"
18
+ langchain-core = "^0.3.36"
19
+ langchain-huggingface = "^0.1.2"
20
+ gradio-pdf = "^0.0.22"
21
+
22
+
23
+ [tool.poetry.group.dev.dependencies]
24
+ pre-commit = "^4.0.1"
25
+ git-lint = "^0.1.2"
26
+ #ruff = "^0.8.3"
27
+ ruff = "^0.9.3"
28
+ pytest = "^8.3.4"
29
+
30
+
31
+ [build-system]
32
+ requires = ["poetry-core"]
33
+ build-backend = "poetry.core.masonry.api"
34
+
35
+
36
+ [tool.ruff]
37
+ select = [
38
+ "E", # pycodestyle
39
+ "F", # pyflakes
40
+ "UP", # pyupgrade
41
+ "D", # pydocstyle
42
+ "I", # isort
43
+ "B", # bugbear
44
+ "ANN", # annotations
45
+ "N", # pep8-naming
46
+ "C4", # Comprehensions
47
+ "DTZ", # DatetimeZ
48
+ "Q", # Quotes
49
+ "SIM", # Simplify
50
+ "RUF", # Ruff
51
+ ]
52
+ ignore = ["D203", "D213"]
53
+ fixable = ["ALL"]
54
+ unfixable = []
55
+ line-length = 120
56
+
57
+
58
+ [tool.black]
59
+ line-length = 120
60
+
61
+ [tool.ruff.lint.pydocstyle]
62
+ convention = "google"
requirements.txt ADDED
@@ -0,0 +1,101 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ accelerate==1.2.1 ; python_version >= "3.10" and python_version < "3.11"
2
+ aiofiles==23.2.1 ; python_version >= "3.10" and python_version < "3.11"
3
+ annotated-types==0.7.0 ; python_version >= "3.10" and python_version < "3.11"
4
+ anyio==4.8.0 ; python_version >= "3.10" and python_version < "3.11"
5
+ certifi==2024.12.14 ; python_version >= "3.10" and python_version < "3.11"
6
+ cffi==1.17.1 ; python_version >= "3.10" and python_version < "3.11" and platform_python_implementation == "PyPy"
7
+ charset-normalizer==3.4.1 ; python_version >= "3.10" and python_version < "3.11"
8
+ click==8.1.8 ; python_version >= "3.10" and python_version < "3.11" and sys_platform != "emscripten"
9
+ colorama==0.4.6 ; python_version >= "3.10" and python_version < "3.11" and platform_system == "Windows"
10
+ exceptiongroup==1.2.2 ; python_version >= "3.10" and python_version < "3.11"
11
+ fastapi==0.115.6 ; python_version >= "3.10" and python_version < "3.11"
12
+ ffmpy==0.5.0 ; python_version >= "3.10" and python_version < "3.11"
13
+ filelock==3.16.1 ; python_version >= "3.10" and python_version < "3.11"
14
+ fsspec==2024.12.0 ; python_version >= "3.10" and python_version < "3.11"
15
+ gradio-client==1.7.0 ; python_version >= "3.10" and python_version < "3.11"
16
+ gradio-pdf==0.0.22 ; python_version >= "3.10" and python_version < "3.11"
17
+ gradio==5.16.1 ; python_version >= "3.10" and python_version < "3.11"
18
+ grpcio==1.67.1 ; python_version >= "3.10" and python_version < "3.11"
19
+ h11==0.14.0 ; python_version >= "3.10" and python_version < "3.11"
20
+ httpcore==1.0.7 ; python_version >= "3.10" and python_version < "3.11"
21
+ httpx==0.28.1 ; python_version >= "3.10" and python_version < "3.11"
22
+ huggingface-hub==0.28.1 ; python_version >= "3.10" and python_version < "3.11"
23
+ idna==3.10 ; python_version >= "3.10" and python_version < "3.11"
24
+ jinja2==3.1.5 ; python_version >= "3.10" and python_version < "3.11"
25
+ joblib==1.4.2 ; python_version >= "3.10" and python_version < "3.11"
26
+ jsonpatch==1.33 ; python_version >= "3.10" and python_version < "3.11"
27
+ jsonpointer==3.0.0 ; python_version >= "3.10" and python_version < "3.11"
28
+ langchain-core==0.3.36 ; python_version >= "3.10" and python_version < "3.11"
29
+ langchain-huggingface==0.1.2 ; python_version >= "3.10" and python_version < "3.11"
30
+ langchain-milvus==0.1.8 ; python_version >= "3.10" and python_version < "3.11"
31
+ langsmith==0.3.8 ; python_version >= "3.10" and python_version < "3.11"
32
+ markdown-it-py==3.0.0 ; python_version >= "3.10" and python_version < "3.11" and sys_platform != "emscripten"
33
+ markupsafe==2.1.5 ; python_version >= "3.10" and python_version < "3.11"
34
+ mdurl==0.1.2 ; python_version >= "3.10" and python_version < "3.11" and sys_platform != "emscripten"
35
+ milvus-lite==2.4.11 ; python_version >= "3.10" and python_version < "3.11" and sys_platform != "win32"
36
+ mpmath==1.3.0 ; python_version >= "3.10" and python_version < "3.11"
37
+ networkx==3.4.2 ; python_version >= "3.10" and python_version < "3.11"
38
+ numpy==2.2.1 ; python_version >= "3.10" and python_version < "3.11"
39
+ nvidia-cublas-cu12==12.1.3.1 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
40
+ nvidia-cuda-cupti-cu12==12.1.105 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
41
+ nvidia-cuda-nvrtc-cu12==12.1.105 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
42
+ nvidia-cuda-runtime-cu12==12.1.105 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
43
+ nvidia-cudnn-cu12==9.1.0.70 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
44
+ nvidia-cufft-cu12==11.0.2.54 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
45
+ nvidia-curand-cu12==10.3.2.106 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
46
+ nvidia-cusolver-cu12==11.4.5.107 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
47
+ nvidia-cusparse-cu12==12.1.0.106 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
48
+ nvidia-nccl-cu12==2.20.5 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
49
+ nvidia-nvjitlink-cu12==12.6.85 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
50
+ nvidia-nvtx-cu12==12.1.105 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version >= "3.10" and python_version < "3.11"
51
+ orjson==3.10.13 ; python_version >= "3.10" and python_version < "3.11"
52
+ packaging==24.2 ; python_version >= "3.10" and python_version < "3.11"
53
+ pandas==2.2.3 ; python_version >= "3.10" and python_version < "3.11"
54
+ pillow==11.1.0 ; python_version >= "3.10" and python_version < "3.11"
55
+ protobuf==5.29.3 ; python_version >= "3.10" and python_version < "3.11"
56
+ psutil==5.9.8 ; python_version >= "3.10" and python_version < "3.11"
57
+ pycparser==2.22 ; python_version >= "3.10" and python_version < "3.11" and platform_python_implementation == "PyPy"
58
+ pydantic-core==2.27.2 ; python_version >= "3.10" and python_version < "3.11"
59
+ pydantic==2.10.4 ; python_version >= "3.10" and python_version < "3.11"
60
+ pydub==0.25.1 ; python_version >= "3.10" and python_version < "3.11"
61
+ pygments==2.19.1 ; python_version >= "3.10" and python_version < "3.11" and sys_platform != "emscripten"
62
+ pymilvus==2.5.4 ; python_version >= "3.10" and python_version < "3.11"
63
+ python-dateutil==2.9.0.post0 ; python_version >= "3.10" and python_version < "3.11"
64
+ python-dotenv==1.0.1 ; python_version >= "3.10" and python_version < "3.11"
65
+ python-multipart==0.0.20 ; python_version >= "3.10" and python_version < "3.11"
66
+ pytz==2024.2 ; python_version >= "3.10" and python_version < "3.11"
67
+ pyyaml==6.0.2 ; python_version >= "3.10" and python_version < "3.11"
68
+ regex==2024.11.6 ; python_version >= "3.10" and python_version < "3.11"
69
+ requests-toolbelt==1.0.0 ; python_version >= "3.10" and python_version < "3.11"
70
+ requests==2.32.3 ; python_version >= "3.10" and python_version < "3.11"
71
+ rich==13.9.4 ; python_version >= "3.10" and python_version < "3.11" and sys_platform != "emscripten"
72
+ ruff==0.9.6 ; python_version >= "3.10" and python_version < "3.11" and sys_platform != "emscripten"
73
+ safehttpx==0.1.6 ; python_version >= "3.10" and python_version < "3.11"
74
+ safetensors==0.5.1 ; python_version >= "3.10" and python_version < "3.11"
75
+ scikit-learn==1.6.1 ; python_version >= "3.10" and python_version < "3.11"
76
+ scipy==1.15.2 ; python_version >= "3.10" and python_version < "3.11"
77
+ semantic-version==2.10.0 ; python_version >= "3.10" and python_version < "3.11"
78
+ sentence-transformers==3.4.1 ; python_version >= "3.10" and python_version < "3.11"
79
+ setuptools==75.8.0 ; python_version >= "3.10" and python_version < "3.11"
80
+ shellingham==1.5.4 ; python_version >= "3.10" and python_version < "3.11" and sys_platform != "emscripten"
81
+ six==1.17.0 ; python_version >= "3.10" and python_version < "3.11"
82
+ sniffio==1.3.1 ; python_version >= "3.10" and python_version < "3.11"
83
+ spaces==0.30.4 ; python_version >= "3.10" and python_version < "3.11"
84
+ starlette==0.41.3 ; python_version >= "3.10" and python_version < "3.11"
85
+ sympy==1.13.3 ; python_version >= "3.10" and python_version < "3.11"
86
+ tenacity==9.0.0 ; python_version >= "3.10" and python_version < "3.11"
87
+ threadpoolctl==3.5.0 ; python_version >= "3.10" and python_version < "3.11"
88
+ tokenizers==0.21.0 ; python_version >= "3.10" and python_version < "3.11"
89
+ tomlkit==0.13.2 ; python_version >= "3.10" and python_version < "3.11"
90
+ torch==2.4.0 ; python_version >= "3.10" and python_version < "3.11"
91
+ tqdm==4.67.1 ; python_version >= "3.10" and python_version < "3.11"
92
+ transformers @ git+https://github.com/huggingface/transformers@dd16acb8a3e93b643aa374c9fb80749f5235c1a6 ; python_version >= "3.10" and python_version < "3.11"
93
+ triton==3.0.0 ; platform_system == "Linux" and platform_machine == "x86_64" and python_version < "3.11" and python_version >= "3.10"
94
+ typer==0.15.1 ; python_version >= "3.10" and python_version < "3.11" and sys_platform != "emscripten"
95
+ typing-extensions==4.12.2 ; python_version >= "3.10" and python_version < "3.11"
96
+ tzdata==2024.2 ; python_version >= "3.10" and python_version < "3.11"
97
+ ujson==5.10.0 ; python_version >= "3.10" and python_version < "3.11"
98
+ urllib3==2.3.0 ; python_version >= "3.10" and python_version < "3.11"
99
+ uvicorn==0.34.0 ; python_version >= "3.10" and python_version < "3.11" and sys_platform != "emscripten"
100
+ websockets==14.1 ; python_version >= "3.10" and python_version < "3.11"
101
+ zstandard==0.23.0 ; python_version >= "3.10" and python_version < "3.11"
src/README.md ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Granite Vision Demos
2
+
3
+ ### RAG
4
+ Run with lazy loading models:
5
+ ```
6
+ LAZY_LOADING=true gradio src/rag_app.py
7
+ ```
8
+
9
+ ## QA
10
+
11
+ ```
12
+ gradio src/qa_app.py
13
+ ```
14
+
src/app.css ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ footer {
2
+ display: none !important;
3
+ }
4
+ .pdf_viewer .top-panel{
5
+ display: none !important;
6
+ }
7
+ .chatbot_view .top-panel {
8
+ display: none !important;
9
+ }
10
+
11
+ .jumping-dots span {
12
+ position: relative;
13
+ bottom: 0px;
14
+ animation: jump 2s infinite;
15
+ }
16
+ .jumping-dots .dot-1{
17
+ animation-delay: 200ms;
18
+ }
19
+ .jumping-dots .dot-2{
20
+ animation-delay: 400ms;
21
+ }
22
+ .jumping-dots .dot-3{
23
+ animation-delay: 600ms;
24
+ }
25
+
26
+ @keyframes jump {
27
+ 0% {bottom: 0px;}
28
+ 20% {bottom: 5px;}
29
+ 40% {bottom: 0px;}
30
+ }
31
+
32
+ .inactive_div {
33
+ pointer-events: none;
34
+ opacity: .5;
35
+ }
36
+
37
+ /*.gallery-container .grid-container {*/
38
+ /* width: 50px;*/
39
+ /*}*/
src/app_head.html ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <script
2
+ async
3
+ src="https://www.googletagmanager.com/gtag/js?id=G-C6LFT227RC"
4
+ ></script>
5
+ <script>
6
+ window.dataLayer = window.dataLayer || [];
7
+ function gtag() {
8
+ dataLayer.push(arguments);
9
+ }
10
+ gtag("js", new Date());
11
+ gtag("config", "G-C6LFT227RC");
12
+ </script>
src/qa_app.py ADDED
@@ -0,0 +1,331 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Template Demo for IBM Granite Hugging Face spaces."""
2
+
3
+ from collections.abc import Iterator
4
+ from datetime import datetime
5
+ from pathlib import Path
6
+ from threading import Thread
7
+
8
+ import gradio as gr
9
+ import PIL
10
+ import spaces
11
+ import torch
12
+ from PIL.Image import Image as PILImage
13
+ from PIL.Image import Resampling
14
+ from transformers import (
15
+ AutoModelForCausalLM,
16
+ AutoModelForVision2Seq,
17
+ AutoProcessor,
18
+ AutoTokenizer,
19
+ LlavaNextForConditionalGeneration,
20
+ LlavaNextProcessor,
21
+ TextIteratorStreamer,
22
+ )
23
+
24
+ from themes.research_monochrome import theme
25
+
26
+ dir_ = Path(__file__).parent.parent
27
+ today_date = datetime.today().strftime("%B %-d, %Y") # noqa: DTZ002
28
+
29
+ MODEL_ID = "ibm-granite/granite-vision-3.2-2b"
30
+ MODEL_ID_PREVIEW = "ibm-granite/granite-vision-3.1-2b-preview"
31
+ # SYS_PROMPT = f"""Knowledge Cutoff Date: April 2024.
32
+ # Today's Date: {today_date}.
33
+ # You are Granite, developed by IBM. You are a helpful AI assistant"""
34
+ TITLE = "IBM Granite VISION 3.1 2b preview"
35
+
36
+ DESCRIPTION = "Try one of the sample prompts below or write your own. Remember, \
37
+ AI models can make mistakes."
38
+ MAX_INPUT_TOKEN_LENGTH = 4096
39
+ MAX_NEW_TOKENS = 1024
40
+ TEMPERATURE = 0.7
41
+ TOP_P = 0.85
42
+ TOP_K = 50
43
+ REPETITION_PENALTY = 1.05
44
+
45
+ sample_data = [
46
+ [
47
+ "https://www.ibm.com/design/language/static/159e89b3d8d6efcb5db43f543df36b23/a5df1/rebusgallery_tshirt.png",
48
+ ["What are the three symbols on the tshirt?"],
49
+ ],
50
+ [
51
+ str(dir_ / "data" / "p2-report.png"),
52
+ [
53
+ "What's the difference in rental income between 2020 and 2019?",
54
+ "Which table entries are less in 2020 than 2019?",
55
+ ],
56
+ ],
57
+ [
58
+ "https://www.ibm.com/design/language/static/159e89b3d8d6efcb5db43f543df36b23/a5df1/rebusgallery_tshirt.png",
59
+ ["What's this?"],
60
+ ],
61
+ ]
62
+
63
+ device = torch.device("cuda" if torch.cuda.is_available() else "mps" if torch.backends.mps.is_available() else "cpu")
64
+
65
+ processor: LlavaNextProcessor = None
66
+ model: LlavaNextForConditionalGeneration = None
67
+
68
+ selected_image: PILImage = None
69
+
70
+
71
+ def image_changed(im: PILImage):
72
+ global selected_image
73
+ if im is None:
74
+ selected_image = None
75
+ else:
76
+ selected_image = im.copy()
77
+ selected_image.thumbnail((800, 800))
78
+ # return selected_image
79
+
80
+
81
+ def create_single_turn(image: PILImage, text: str) -> dict:
82
+ if image is None:
83
+ return {
84
+ "role": "user",
85
+ "content": [
86
+ {"type": "text", "text": text},
87
+ ],
88
+ }
89
+ else:
90
+ return {
91
+ "role": "user",
92
+ "content": [
93
+ {"type": "image", "image": image},
94
+ {"type": "text", "text": text},
95
+ ],
96
+ }
97
+
98
+
99
+ @spaces.GPU
100
+ def generate(
101
+ image: PILImage,
102
+ message: str,
103
+ chat_history: list[dict],
104
+ temperature: float = TEMPERATURE,
105
+ repetition_penalty: float = REPETITION_PENALTY,
106
+ top_p: float = TOP_P,
107
+ top_k: float = TOP_K,
108
+ max_new_tokens: int = MAX_NEW_TOKENS,
109
+ ):
110
+ """Generate function for chat demo.
111
+
112
+ Args:
113
+ max_new_tokens:
114
+ top_k:
115
+ top_p:
116
+ repetition_penalty:
117
+ temperature:
118
+ image: the image to be talked about...
119
+ message (str): The latest input message from the user.
120
+ chat_history (list[dict]): A list of dictionaries representing previous chat history, where each dictionary
121
+ contains 'role' and 'content'.
122
+
123
+ Yields:
124
+ str: The generated response, broken down into smaller chunks.
125
+ """
126
+
127
+ print(top_p)
128
+ # Build messages
129
+ conversation = []
130
+ # TODO: maybe add back custom sys prompt
131
+ # conversation.append({"role": "system", "content": SYS_PROMPT})
132
+ conversation += chat_history
133
+ conversation.append(create_single_turn(image, message))
134
+
135
+ # Convert messages to prompt format
136
+ inputs = processor.apply_chat_template(
137
+ conversation, add_generation_prompt=True, tokenize=True, return_dict=True, return_tensors="pt"
138
+ ).to(device)
139
+
140
+ # TODO: This might cut out the image tokens -- find better strategy
141
+ # if input_ids.shape[1] > MAX_INPUT_TOKEN_LENGTH:
142
+ # input_ids = input_ids[:, -MAX_INPUT_TOKEN_LENGTH:]
143
+ # gr.Warning(f"Trimmed input from conversation as it was longer than {MAX_INPUT_TOKEN_LENGTH} tokens.")
144
+
145
+ generate_kwargs = dict(
146
+ max_new_tokens=max_new_tokens,
147
+ do_sample=True,
148
+ top_p=top_p,
149
+ top_k=top_k,
150
+ temperature=temperature,
151
+ num_beams=1,
152
+ repetition_penalty=repetition_penalty,
153
+ )
154
+ output = model.generate(**inputs, **generate_kwargs)
155
+ out = processor.decode(output[0], skip_special_tokens=True)
156
+ out_s = out.strip().split("<|assistant|>")
157
+ return [gr.ChatMessage(role="user", content=message), gr.ChatMessage(role="assistant", content=out_s[-1])]
158
+
159
+
160
+ def multimodal_generate_v2(
161
+ msg: str,
162
+ temperature: float = TEMPERATURE,
163
+ repetition_penalty: float = REPETITION_PENALTY,
164
+ top_p: float = TOP_P,
165
+ top_k: float = TOP_K,
166
+ max_new_tokens: int = MAX_NEW_TOKENS,
167
+ ):
168
+ global model, processor
169
+
170
+ # lazy loading and adding image
171
+ if model is None:
172
+ processor = AutoProcessor.from_pretrained(MODEL_ID)
173
+ model = AutoModelForVision2Seq.from_pretrained(MODEL_ID, device_map="auto").to(device)
174
+
175
+ return generate(
176
+ selected_image,
177
+ msg,
178
+ [],
179
+ temperature=temperature,
180
+ repetition_penalty=repetition_penalty,
181
+ top_p=top_p,
182
+ top_k=top_k,
183
+ max_new_tokens=max_new_tokens,
184
+ )
185
+
186
+
187
+ tb = gr.Textbox(submit_btn=True)
188
+ # advanced settings (displayed in Accordion)
189
+ temperature_slider = gr.Slider(
190
+ minimum=0,
191
+ maximum=1.0,
192
+ value=TEMPERATURE,
193
+ step=0.1,
194
+ label="Temperature",
195
+ elem_classes=["gr_accordion_element"],
196
+ interactive=True,
197
+ )
198
+ top_p_slider = gr.Slider(
199
+ minimum=0,
200
+ maximum=1.0,
201
+ value=TOP_P,
202
+ step=0.05,
203
+ label="Top P",
204
+ elem_classes=["gr_accordion_element"],
205
+ interactive=True,
206
+ )
207
+ top_k_slider = gr.Slider(
208
+ minimum=0, maximum=100, value=TOP_K, step=1, label="Top K", elem_classes=["gr_accordion_element"], interactive=True
209
+ )
210
+ repetition_penalty_slider = gr.Slider(
211
+ minimum=0,
212
+ maximum=2.0,
213
+ value=REPETITION_PENALTY,
214
+ step=0.05,
215
+ label="Repetition Penalty",
216
+ elem_classes=["gr_accordion_element"],
217
+ interactive=True,
218
+ )
219
+ max_new_tokens_slider = gr.Slider(
220
+ minimum=1,
221
+ maximum=2000,
222
+ value=MAX_NEW_TOKENS,
223
+ step=1,
224
+ label="Max New Tokens",
225
+ elem_classes=["gr_accordion_element"],
226
+ interactive=True,
227
+ )
228
+
229
+ chatbot = gr.Chatbot(examples=[{"text": "Hello World!"}], type="messages", label="Q&A about selected document")
230
+
231
+ css_file_path = Path(Path(__file__).parent / "app.css")
232
+ head_file_path = Path(Path(__file__).parent / "app_head.html")
233
+
234
+ with gr.Blocks(fill_height=True, css_paths=css_file_path, head_paths=head_file_path, theme=theme, title=TITLE) as demo:
235
+ is_in_edit_mode = gr.State(True) # in block to be reactive
236
+
237
+ gr.Markdown(f"# {TITLE}")
238
+ gr.Markdown(DESCRIPTION)
239
+ with gr.Row():
240
+ with gr.Column():
241
+ # create sample image object for reference, render later
242
+ image_x = gr.Image(
243
+ type="pil",
244
+ label="Example image",
245
+ render=False,
246
+ interactive=False,
247
+ show_label=False,
248
+ show_fullscreen_button=False,
249
+ height=800,
250
+ )
251
+ image_x.change(fn=image_changed, inputs=image_x)
252
+
253
+ # Create Dataset object and render it
254
+ ds = gr.Dataset(label="Select one document", samples=sample_data, components=[gr.Image(render=False)])
255
+
256
+ def sample_image_selected(d: gr.SelectData, dx):
257
+ return gr.Image(dx[0]), gr.update(examples=[{"text": x} for x in dx[1]])
258
+
259
+ ds.select(lambda: [], outputs=[chatbot])
260
+ ds.select(sample_image_selected, inputs=[ds], outputs=[image_x, chatbot])
261
+
262
+ # Render image object after DS
263
+ image_x.render()
264
+ with gr.Column():
265
+ # Render ChatBot
266
+ chatbot.render()
267
+
268
+ # Define behavior for example selection
269
+ def update_user_chat_x(x: gr.SelectData):
270
+ return [gr.ChatMessage(role="user", content=x.value["text"])]
271
+
272
+ def send_generate_x(x: gr.SelectData, temperature, repetition_penalty, top_p, top_k, max_new_tokens):
273
+ txt = x.value["text"]
274
+ return multimodal_generate_v2(txt, temperature, repetition_penalty, top_p, top_k, max_new_tokens)
275
+
276
+ chatbot.example_select(lambda: False, outputs=is_in_edit_mode)
277
+ chatbot.example_select(update_user_chat_x, outputs=[chatbot])
278
+ chatbot.example_select(
279
+ send_generate_x,
280
+ inputs=[
281
+ temperature_slider,
282
+ repetition_penalty_slider,
283
+ top_p_slider,
284
+ top_k_slider,
285
+ max_new_tokens_slider,
286
+ ],
287
+ outputs=[chatbot],
288
+ )
289
+
290
+ # Create User Chat Textbox and Reset Button
291
+ tbb = gr.Textbox(submit_btn=True, show_label=False)
292
+ fb = gr.Button("Reset Chat", visible=False)
293
+ fb.click(lambda: [], outputs=[chatbot])
294
+
295
+ # Handle toggling betwwen edit and non-edit mode
296
+ def textbox_switch(emode):
297
+ # if t.visible:
298
+ if not emode:
299
+ return [gr.update(visible=False), gr.update(visible=True)]
300
+ else:
301
+ return [gr.update(visible=True), gr.update(visible=False)]
302
+
303
+ tbb.submit(lambda: False, outputs=[is_in_edit_mode])
304
+ fb.click(lambda: True, outputs=[is_in_edit_mode])
305
+ is_in_edit_mode.change(textbox_switch, inputs=[is_in_edit_mode], outputs=[tbb, fb])
306
+
307
+ # submit user question
308
+ tbb.submit(lambda x: [gr.ChatMessage(role="user", content=x)], inputs=tbb, outputs=chatbot)
309
+ tbb.submit(
310
+ multimodal_generate_v2,
311
+ inputs=[
312
+ tbb,
313
+ temperature_slider,
314
+ repetition_penalty_slider,
315
+ top_p_slider,
316
+ top_k_slider,
317
+ max_new_tokens_slider,
318
+ ],
319
+ outputs=[chatbot],
320
+ )
321
+
322
+ # extra model parameters
323
+ with gr.Accordion("Advanced Settings", open=False):
324
+ max_new_tokens_slider.render()
325
+ temperature_slider.render()
326
+ top_k_slider.render()
327
+ top_p_slider.render()
328
+ repetition_penalty_slider.render()
329
+
330
+ if __name__ == "__main__":
331
+ demo.queue(max_size=20).launch()
src/rag_app.py ADDED
@@ -0,0 +1,275 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Template Demo for IBM Granite Hugging Face spaces."""
2
+ import os
3
+ import time
4
+ from pathlib import Path
5
+ import re
6
+
7
+ import gradio as gr
8
+ import spaces
9
+ import torch
10
+ from gradio_pdf import PDF
11
+
12
+ from sandbox.light_rag.light_rag import LightRAG
13
+ from themes.research_monochrome import theme
14
+
15
+ dir_ = Path(__file__).parent.parent
16
+
17
+ TITLE = "Multimodal RAG with Granite Vision 3.2"
18
+
19
+ DESCRIPTION = """
20
+ <p>This experimental demo highlights granite-vision-3.2-2b capabilities within a multimodal retrieval-augmented generation (RAG) pipeline, demonstrating Granite's document understanding in real-world applications. Explore the sample document excerpts and try the sample prompts or enter your own. Keep in mind that AI can occasionally make mistakes.
21
+ <span class="gr_docs_link">
22
+ <a href="https://www.ibm.com/granite/docs/models/vision/">View Documentation <i class="fa fa-external-link"></i></a>
23
+ </span>
24
+ </p>
25
+ """
26
+
27
+ device = torch.device("cuda" if torch.cuda.is_available() else "mps" if torch.backends.mps.is_available() else "cpu")
28
+
29
+ BASE_PATH = dir_ / "data" / "final_v2_mar04"
30
+ PDFS_PATH = BASE_PATH / "pdfs"
31
+ MILVUS_PATH = BASE_PATH / "milvus"
32
+ IMAGES_PATH = BASE_PATH / "images"
33
+ PREVIEWS_PATH = BASE_PATH / "preview"
34
+
35
+ sample_data = [
36
+ {
37
+ "preview_image": str(PREVIEWS_PATH / "IBM-financial-2010.png"),
38
+ "prompts": """Where geographically was the greatest growth in revenue in 2007?
39
+ Which year had the highest income in billion?
40
+ Did the net income decrease in 2007 compared to 2006?
41
+ Net cash from operations on 2005?
42
+ What does it mean to be Globally Integrated Enterprise?
43
+ What are the segments for pretax income?""".split("\n"),
44
+ "pdf": str(PDFS_PATH / "IBM_Annual_Report_2007_3-20.pdf"),
45
+ "index": "ibm_report_2007_short_text_milvus_lite_2048_128_slate_278m_cosine",
46
+ "db": str(MILVUS_PATH / "milvus.db"),
47
+ "name": "IBM annual report 2007",
48
+ "origin": "https://www.ibm.com/investor/att/pdf/IBM_Annual_Report_2007.pdf",
49
+ "image_paths": {"prefix": str(IMAGES_PATH / "ibm_report_2007") + "/", "use_last": 2},
50
+ },
51
+ {
52
+ "preview_image": str(PREVIEWS_PATH / "Wilhlborg-financial.png"),
53
+ "prompts": """Where does Wihlborgs mainly operate?
54
+ Which year had the second lowest Equity/assets ratio?
55
+ Which year had the highest Project investments value?
56
+ What is the trend of equity/assets ratio?
57
+ What was the Growth percentage in income from property management in 2020?
58
+ Has the company’s interest coverage ratio increased or decreased in recent years?""".split("\n")
59
+ ,
60
+ "pdf": str(PDFS_PATH / "wihlborgs-2-13_16-18.pdf"),
61
+ "index": "wihlborgs_short_text_milvus_lite_2048_128_slate_278m_cosine",
62
+ "db": str(MILVUS_PATH / "milvus.db"),
63
+ "name": "Wihlborgs Report 2020",
64
+ "origin": "https://www.wihlborgs.se/globalassets/investor-relations/rapporter/2021/20210401-wihlborgs-annual-report-and-sustainability-report-2020-c24a6b51-c124-44fc-a4af-4237a33a29fb.pdf",
65
+ "image_paths": {"prefix": str(IMAGES_PATH / "wihlborgs") + "/", "use_last": 2},
66
+ },
67
+ ]
68
+
69
+ config = {
70
+ "embedding_model_id": "ibm-granite/granite-embedding-278m-multilingual",
71
+ "generation_model_id": "ibm-granite/granite-3.1-8b-instruct",
72
+ "milvus_collection_name": "granite_vision_tech_report_text_milvus_lite_512_128_slate_125m_cosine",
73
+ "milvus_db_path": str(dir_ / "data" / MILVUS_PATH / "milvus_text_sample.db"),
74
+ }
75
+
76
+ if gr.NO_RELOAD:
77
+ light_rag: LightRAG = LightRAG(config)
78
+ if not os.environ.get("LAZY_LOADING") == "true":
79
+ for sample in sample_data:
80
+ light_rag.precache_milvus(sample["index"], sample["db"])
81
+
82
+
83
+ def lower_md_headers(md: str) -> str:
84
+ return re.sub(r'(?:^|\n)##?\s(.+)', lambda m: '\n### ' + m.group(1), md)
85
+
86
+
87
+ # Parser for retrival results
88
+ def format_retrieval_result(i, d, cb, selected_sample):
89
+ image_paths = sample_data[selected_sample]["image_paths"]
90
+
91
+ if d.metadata["type"] == "text":
92
+ context_string = f"---\n## Context {i + 1}\n#### (text extracted from document)\n{lower_md_headers(d.page_content)}\n"
93
+ cb.append(gr.ChatMessage(role="assistant", content=context_string))
94
+ return True
95
+ elif d.metadata["type"] == "image_description":
96
+ context_string = f"---\n## Context {i + 1}\n#### (image description generated by Granite Vision)"
97
+ cb.append(gr.ChatMessage(role="assistant", content=context_string))
98
+
99
+ # /dccstor/mm-rag/idanfr/granite_vision_demo/wdu_output/IBM_Annual_Report_2007/images/IBM_Annual_Report_2007_im_image_7_1.png
100
+ image_path_parts = d.metadata["image_fullpath"].split("/")
101
+ image_path = image_paths["prefix"] + ("/".join(image_path_parts[-image_paths["use_last"]:]))
102
+ # print(f"image_path: {image_path}")
103
+ cb.append(gr.ChatMessage(role="assistant", content=gr.Image(image_path)))
104
+
105
+ cb.append(gr.ChatMessage(role="assistant", content=f"\n{lower_md_headers(d.metadata['image_description'])}\n"))
106
+
107
+
108
+ chatbot = gr.Chatbot(
109
+ examples=[{"text": x} for x in sample_data[0]["prompts"]],
110
+ type="messages",
111
+ label=f"Q&A about {sample_data[0]['name']}",
112
+ height=685,
113
+ group_consecutive_messages=True,
114
+ autoscroll=False,
115
+ elem_classes=["chatbot_view"],
116
+ )
117
+
118
+
119
+ @spaces.GPU()
120
+ def generate_with_llm(query, context):
121
+ if os.environ.get("NO_LLM"):
122
+ time.sleep(2)
123
+ return "Now answer, just a string", query
124
+ return light_rag.generate(query=query, context=context)
125
+
126
+
127
+ # TODO: maybe add GPU back ?
128
+ def retrieval(collection, db, q):
129
+ return light_rag.search(q, top_n=3, collection=collection, db=db)
130
+
131
+
132
# ################
# User Interface
# ################
css_file_path = Path(Path(__file__).parent / "app.css")
head_file_path = Path(Path(__file__).parent / "app_head.html")

with gr.Blocks(fill_height=True, css_paths=css_file_path, head_paths=head_file_path, theme=theme, title=TITLE) as demo:
    # Reactive state must be declared inside the Blocks context.
    is_in_edit_mode = gr.State(True)  # in block to be reactive
    selected_doc = gr.State(0)  # index into sample_data for the currently selected document
    current_question = gr.State("")  # last question text (typed or example click)

    gr.Markdown(f"# {TITLE}")
    gr.Markdown(DESCRIPTION)
    with gr.Row():
        # LEFT COLUMN: Sample selection, download, and PDF viewer
        with gr.Column():
            # Show preview images
            images_only = [sd["preview_image"] for sd in sample_data]
            document_gallery = gr.Gallery(
                images_only,
                label="Select a document",
                rows=1,
                columns=3,
                height="125px",
                # width="125px",
                allow_preview=False,
                selected_index=0,
                elem_classes=["preview_im_element"],
            )
            with gr.Group():
                pdf_display = PDF(
                    sample_data[0]["pdf"],
                    label=f"Preview for {sample_data[0]['name']}",
                    height=460,
                    interactive=False,
                    elem_classes=["pdf_viewer"],
                )
                dl_btn = gr.DownloadButton(
                    label=f"Download PDF ({sample_data[0]['name']})", value=sample_data[0]["pdf"], visible=True
                )
174
+ def sample_image_selected(d: gr.SelectData):
175
+ dx = sample_data[d.index]
176
+ # print(f"DX:{dx}")
177
+ return (
178
+ gr.update(examples=[{"text": x} for x in dx["prompts"]], label=f"Q&A about {dx['name']}"),
179
+ gr.update(value=dx["pdf"], label=f"Preview for {dx['name']}"),
180
+ gr.DownloadButton(value=dx["pdf"], label=f"Download PDF ({dx['name']})"),
181
+ d.index
182
+ )
183
+
184
+
185
            # Two handlers fire on the same event: first clear the chat history,
            # then load the newly selected document (examples, preview, download).
            document_gallery.select(lambda: [], outputs=[chatbot])
            document_gallery.select(sample_image_selected, inputs=[],
                                    outputs=[chatbot, pdf_display, dl_btn, selected_doc])
188
+
189
        # Right Column: Chat interface
        with gr.Column():
            # Render ChatBot (the component itself was constructed above, before the Blocks context)
            chatbot.render()
193
+
194
+
195
+ # Define behavior for example selection
196
+ def update_user_chat_x(x: gr.SelectData):
197
+ return [gr.ChatMessage(role="user", content=x.value["text"])]
198
+
199
+
200
+ def question_from_selection(x: gr.SelectData):
201
+ return x.value["text"]
202
+
203
+
204
+ def _decorate_yield_result(cb, fb_status=False, gallery_status=False):
205
+ return cb, gr.Button(interactive=fb_status), gr.Gallery(
206
+ elem_classes=["preview_im_element"] if gallery_status else ["preview_im_element", "inactive_div"])
207
+
208
+
209
            def send_generate(msg, cb, selected_sample):
                """Full question pipeline as a streaming generator.

                Echoes the user message, shows a "querying index" placeholder,
                streams retrieved context into the chat, swaps the placeholder
                for a "waiting for LLM" message, and finally replaces it with
                the generated answer.  Each yield is a (chatbot, follow-up
                button, gallery) update tuple from _decorate_yield_result.
                """
                collection = sample_data[selected_sample]["index"]
                db = sample_data[selected_sample]["db"]
                # print(f"collection: {collection}, {db}")

                original_msg = gr.ChatMessage(role="user", content=msg)
                cb.append(original_msg)
                # Placeholder shown while the vector index is queried.
                # NOTE(review): the code below overwrites cb[1] in place, which
                # assumes the history was cleared before this call so the user
                # message is cb[0] and this placeholder is cb[1] — confirm.
                waiting_for_retrieval_msg = gr.ChatMessage(role="assistant",
                                                           content='## Answer\n*Querying Index*<span class="jumping-dots"><span class="dot-1">.</span> <span class="dot-2">.</span> <span class="dot-3">.</span></span>')
                cb.append(waiting_for_retrieval_msg)
                yield _decorate_yield_result(cb)

                q = msg.strip()
                results = retrieval(collection, db, q)

                # for d in results:
                #     print(f"****\n{d}")

                # NOTE(review): context_string appears unused below — the per-result
                # context text is appended to cb by format_retrieval_result instead.
                context_string = "## Context Documents for Answer\n\n"
                for i, d in enumerate(results):
                    # format_retrieval_result mutates cb; yield after each appended result.
                    if format_retrieval_result(i, d, cb, selected_sample):
                        yield _decorate_yield_result(cb)
                waiting_for_llm_msg = gr.ChatMessage(role="assistant",
                                                     content='## Answer\n *Waiting for LLM* <span class="jumping-dots"><span class="dot-1">.</span> <span class="dot-2">.</span> <span class="dot-3">.</span></span> ')
                # Replace the placeholder at index 1 rather than appending.
                cb[1] = waiting_for_llm_msg
                yield _decorate_yield_result(cb)

                answer, prompt = generate_with_llm(q, results)
                cb[1] = gr.ChatMessage(role="assistant", content=f"## Answer\n<b>{answer.strip()}</b>")
                # cb.pop()
                # cb.append(gr.ChatMessage(role="assistant", content=f"## Answer\n<b>{answer.strip()}</b>"))
                # Final yield re-enables the follow-up button and the gallery.
                yield _decorate_yield_result(cb, fb_status=True, gallery_status=True)
241
+
242
+
243
            # Create User Chat Textbox and Reset Button
            tbb = gr.Textbox(submit_btn=True, show_label=False, placeholder="Type a message...")
            fb = gr.Button("Ask new question", visible=False)
            fb.click(lambda: [], outputs=[chatbot])

            # Example click: leave edit mode, stash the question text in state,
            # then run the retrieval + generation pipeline.
            chatbot.example_select(lambda: False, outputs=is_in_edit_mode)
            # chatbot.example_select(update_user_chat_x, outputs=[chatbot])
            chatbot.example_select(question_from_selection, inputs=[], outputs=[current_question]
                                   ).then(send_generate, inputs=[current_question, chatbot, selected_doc],
                                          outputs=[chatbot, fb, document_gallery])
253
+
254
+
255
+ def textbox_switch(e_mode): # Handle toggling between edit and non-edit mode
256
+ if not e_mode:
257
+ return [gr.update(visible=False), gr.update(visible=True)]
258
+ else:
259
+ return [gr.update(visible=True), gr.update(visible=False)]
260
+
261
+
262
            # Mode bookkeeping: submitting a question leaves edit mode; the
            # follow-up button re-enters it.  The mode change swaps tbb/fb visibility.
            tbb.submit(lambda: False, outputs=[is_in_edit_mode])
            fb.click(lambda: True, outputs=[is_in_edit_mode])
            is_in_edit_mode.change(textbox_switch, inputs=[is_in_edit_mode], outputs=[tbb, fb])

            # submit user question
            # tbb.submit(lambda x: [gr.ChatMessage(role="user", content=x)], inputs=tbb, outputs=chatbot)
            tbb.submit(lambda x: x, inputs=[tbb], outputs=[current_question]
                       ).then(send_generate,
                              inputs=[current_question, chatbot, selected_doc],
                              outputs=[chatbot, fb, document_gallery])

if __name__ == "__main__":
    # demo.queue(max_size=20).launch()
    demo.launch()
src/sandbox/light_rag/credits.txt ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ Light RAG code is adapted from work by:
2
+ Idan Friedmann (IBM)
3
+ Roi Pony (IBM)
4
+ Adi Raz Goldfarb (IBM)
src/sandbox/light_rag/hf_embedding.py ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import List
2
+
3
+ from langchain_huggingface import HuggingFaceEmbeddings
4
+
5
+ from sandbox.light_rag.utils import get_device
6
+
7
+
8
class HFEmbedding:
    """Thin wrapper around LangChain's HuggingFaceEmbeddings.

    Exposes a uniform embed_batch / embed_documents / embed_query surface so
    the rest of the pipeline does not depend on the LangChain API directly.
    """

    def __init__(
        self,
        model_id: str,
    ):
        chosen_device = get_device()
        # TODO: hack for zeroGPU
        chosen_device = "cpu"

        print(f"Using device: {chosen_device}")
        if chosen_device == "cpu":
            print("Using CPU might be too slow")

        self.model_name = model_id

        print(f"Loading embeddings model from: {self.model_name}")
        self.embeddings_service = HuggingFaceEmbeddings(
            model_name=self.model_name,
            model_kwargs={"device": chosen_device},
        )

    def embed_batch(self, batch: list[str]):
        """Embed one batch of texts (alias for embed_documents)."""
        return self.embed_documents(batch)

    def embed_documents(self, texts: list[str]) -> list[list[float]]:
        """Return one embedding vector per input text."""
        return self.embeddings_service.embed_documents(texts)

    def embed_query(self, text: str) -> list[float]:
        """Embed a single query string and return its vector."""
        (vector,) = self.embed_documents([text])
        return vector
src/sandbox/light_rag/hf_llm.py ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from transformers import AutoModelForCausalLM, AutoTokenizer
2
+
3
+ from sandbox.light_rag.utils import get_device
4
+
5
+
6
class HFLLM:
    """Minimal Hugging Face causal-LM wrapper (tokenizer + model + generate)."""

    def __init__(self, model_name: str):
        self.device = get_device()
        self.model_name = model_name
        print("Loading HF model...")
        # Load the tokenizer and model from Hugging Face
        self.tokenizer = AutoTokenizer.from_pretrained(model_name)
        self.model = AutoModelForCausalLM.from_pretrained(model_name).to(self.device)

    def generate(self, prompt: str) -> list:
        """Run greedy generation on `prompt`.

        Returns a single-element list of {"answer": text} where the text is
        the final assistant turn: everything after the last <|end_of_role|>
        marker, truncated at the first <|end_of_text|>.
        """
        encoded = self.tokenizer(prompt, return_tensors="pt").to(self.device)
        output_ids = self.model.generate(**encoded, max_new_tokens=1024)
        decoded = self.tokenizer.batch_decode(output_ids, skip_special_tokens=False)
        # print(f"gen txt: {decoded}")

        raw = decoded[0]
        answer = raw.split("<|end_of_role|>")[-1].split("<|end_of_text|>")[0]
        return [{"answer": answer}]
src/sandbox/light_rag/light_rag.py ADDED
@@ -0,0 +1,168 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import logging
2
+ import os
3
+ from typing import List
4
+
5
+ from langchain_core.documents import Document
6
+ from langchain_core.vectorstores import VectorStore
7
+ from langchain_milvus import Milvus
8
+
9
+ from sandbox.light_rag.hf_embedding import HFEmbedding
10
+ from sandbox.light_rag.hf_llm import HFLLM
11
+
12
# NOTE(review): context_template and token_limit are not referenced anywhere in
# this module — presumably leftovers from an earlier prompt-building path; verify
# before removing.
context_template = "Document:\n{document}\n"
token_limit = 4096
# Root logger; the app is expected to configure handlers (see utils.init_logger).
logger = logging.getLogger()
15
+
16
+
17
class LightRAG:
    """Minimal retrieval-augmented-generation pipeline.

    Wraps a Milvus vector store (retrieval), an HF embedding model, and an HF
    causal LM (generation).  Models can be loaded lazily by setting the
    LAZY_LOADING environment variable; Milvus index handles are cached per
    (collection, db) pair.
    """

    def __init__(self, config: dict):
        self.config = config
        lazy_loading = os.environ.get("LAZY_LOADING")
        # With LAZY_LOADING set, the heavy models are built on first use instead of here.
        self.gen_model = None if lazy_loading else HFLLM(config['generation_model_id'])
        self._embedding_model = None if lazy_loading else HFEmbedding(config['embedding_model_id'])
        # Milvus handles keyed by _cache_key(collection, db).
        self._pre_cached_indices = {}

    def _get_embedding_model(self):
        """Lazily construct and memoize the embedding model."""
        if self._embedding_model is None:
            self._embedding_model = HFEmbedding(self.config['embedding_model_id'])
        return self._embedding_model

    def _make_milvus_index(self, collection, db):
        """Build a Milvus vector-store handle for `collection` stored at `db`.

        Fix: the original passed index_params={"metric_ttpe": ...} — a typo for
        "metric_type" — so the cosine metric setting was likely never applied.
        """
        return Milvus(
            embedding_function=self._get_embedding_model(),
            collection_name=collection.replace("-", "_"),  # Milvus names cannot contain '-'
            index_params={"metric_type": "COSINE"},
            connection_args={"uri": db},
        )

    def precache_milvus(self, collection, db):
        """Eagerly build and cache the Milvus index for (collection, db)."""
        key = self._cache_key(collection, db)
        self._pre_cached_indices[key] = self._make_milvus_index(collection, db)

    def _get_milvus_index(self, collection, db):
        """Return the cached Milvus handle for (collection, db), or build a fresh one."""
        key = self._cache_key(collection, db)
        if key in self._pre_cached_indices:
            print(f"cache hit: {key}")
            return self._pre_cached_indices[key]
        return self._make_milvus_index(collection, db)

    def search(self, query: str, top_n: int = 5, collection=None, db=None) -> "list[Document]":
        """Retrieve up to `top_n` context documents for `query`.

        Falls back to the configured collection/db when none are given.
        Over-fetches (k=100), then keeps all "text" chunks and at most one
        "image_description" per source document.
        """
        col_name = self.config["milvus_collection_name"] if collection is None else collection
        db = self.config["milvus_db_path"] if db is None else db
        vs = self._get_milvus_index(col_name, db)

        context = vs.similarity_search(
            query=query,
            k=100,
        )

        results = []
        for d in context:
            if d.metadata.get("type") == "text":  # and not ("Picture placeholder" in d.page_content):
                results.append(d)
            elif d.metadata.get("type") == "image_description":
                # De-duplicate: keep only the first image description per document_id.
                if not any(r.metadata["document_id"] == d.metadata.get("document_id") for r in results):
                    results.append(d)

        # Slicing already copes with top_n > len(results).
        return results[:top_n]

    def _build_prompt(self, question: str, context: "List[Document]"):
        """Render the Granite chat prompt for `question` grounded in `context` documents."""
        # Robustness: tolerate context=None (generate()'s default) instead of crashing.
        text_documents = []
        for doc in context or []:
            if doc.metadata['type'] == 'text':
                text_documents.append(doc.page_content.strip())
            elif doc.metadata['type'] == 'image_description':
                text_documents.append(doc.metadata['image_description'].strip())
            else:
                logger.warning('Should not get here!')

        documents = [{"text": x} for x in text_documents]
        prompt = self.gen_model.tokenizer.apply_chat_template(
            conversation=[
                {
                    "role": "user",
                    "content": question,
                }
            ],
            documents=documents,  # This uses the documents support in the Granite chat template
            add_generation_prompt=True,
            tokenize=False,
        )
        return prompt

    def generate(self, query, context=None):
        """Generate an answer for `query` from `context` documents.

        Lazily loads the generation model on first call.  Returns
        (answer, prompt) so callers can inspect the rendered prompt.
        """
        if self.gen_model is None:
            self.gen_model = HFLLM(self.config["generation_model_id"])

        prompt = self._build_prompt(query, context)
        results = self.gen_model.generate(prompt)
        answer = results[0]["answer"]
        return answer, prompt

    def _cache_key(self, collection, db):
        """Stable cache key combining collection name and db path."""
        return collection + "___" + db
143
+
144
+ # if __name__ == '__main__':
145
+ # from dotenv import load_dotenv
146
+ # load_dotenv()
147
+ #
148
+ # config = {
149
+ # "embedding_model_id": "ibm-granite/granite-embedding-125m-english",
150
+ # "generation_model_id": "ibm-granite/granite-3.1-8b-instruct",
151
+ # "milvus_collection_name": "granite_vision_tech_report_text_milvus_lite_512_128_slate_125m_cosine",
152
+ # "milvus_db_path": "/dccstor/mm-rag/adi/code/RAGEval/milvus/text/milvus.db"
153
+ # }
154
+ #
155
+ # rag_app = LightRAG(config)
156
+ #
157
+ # query = "What models are available in Watsonx?"
158
+ #
159
+ # # run retrieval
160
+ # context = rag_app.search(query=query, top_n=5)
161
+ # # generate answers
162
+ # answer, prompt = rag_app.generate(query=query, context=context)
163
+ #
164
+ # print(f"Answer:\n{answer}")
165
+ # print(f"Used prompt:\n{prompt}")
166
+
167
+
168
+ # python -m debugpy --connect cccxl009.pok.ibm.com:3002 ./sandbox/light_rag/light_rag.py
src/sandbox/light_rag/utils.py ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import logging
2
+ import os
3
+ import re
4
+ from collections.abc import Sequence
5
+ from datetime import datetime, timezone
6
+ from pathlib import Path
7
+
8
+ import torch
9
+ import yaml
10
+
11
+
12
def batchify(seq: Sequence, batch_size: int):
    """Yield successive slices of `seq` of length `batch_size` (the last may be shorter)."""
    start = 0
    while start < len(seq):
        yield seq[start:start + batch_size]
        start += batch_size
15
+
16
+
17
def get_device():
    """Pick the best available torch device: Apple MPS, then CUDA, then CPU."""
    candidates = (
        ("mps", torch.backends.mps.is_available),  # mac GPU
        ("cuda", torch.cuda.is_available),
    )
    for name, available in candidates:
        if available():
            return name
    return "cpu"
24
+
25
+
26
def init_logger():
    """Configure root logging: INFO level with a timestamped message format.

    No-op if the root logger already has handlers (basicConfig semantics).
    """
    log_format = "%(asctime)s - %(name)s - %(levelname)s - %(message)s"
    logging.basicConfig(level=logging.INFO, format=log_format)
+
32
+
33
def get_timestamp():
    """Current UTC time as 'YYYY_MM_DD-HH_MM_SS' (lexicographic == chronological order)."""
    now = datetime.now(timezone.utc)
    return now.strftime("%Y_%m_%d-%H_%M_%S")
35
+
36
+
37
# Matches names produced by get_timestamp(), e.g. "2024_01_15-09_30_00".
TIMESTAMP_PATTERN = re.compile(r"^\d{4}_\d{2}_\d{2}-\d{2}_\d{2}_\d{2}$")


def get_last_timestamp(path: Path):
    """Return the latest timestamp-named entry under `path`.

    Returns None when the directory does not exist or holds no entries that
    match TIMESTAMP_PATTERN.  Lexicographic max equals chronological latest
    for this format.
    """
    if not os.path.exists(path):
        return None
    stamps = [entry for entry in os.listdir(path) if TIMESTAMP_PATTERN.match(entry)]
    return max(stamps) if stamps else None
src/themes/carbon.py ADDED
@@ -0,0 +1,147 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """IBM Carbon theme for gradio demos.
2
+
3
+ This version builds on top of the Carbon theme to make it more playful with rounded corners, a larger font family to
4
+ enhance readability, and the IBM Cool Gray color palette for better consistency with other IBM Research demos, such as
5
+ Bee.
6
+ """
7
+
8
+ import gradio as gr
9
+ from gradio.themes.utils import sizes
10
+
11
# Carbon-styled Gradio theme: IBM Blue for primary/secondary hues, IBM Cool
# Gray for neutrals, IBM Plex fonts.  Built once at import time and shared.
theme = gr.themes.Base(
    # IBM Blue ramp (Blue 10..100) for both primary and secondary hues.
    primary_hue=gr.themes.Color(
        c100="#EDF5FF",
        c200="#D0E2FF",
        c300="#A6C8FF",
        c400="#78A9FF",
        c50="#F9F9FB",
        c500="#4589FF",
        c600="#0F62FE",
        c700="#0043CE",
        c800="#002D9C",
        c900="#001D6C",
        c950="#001141",
    ),
    secondary_hue=gr.themes.Color(
        c100="#EDF5FF",
        c200="#D0E2FF",
        c300="#A6C8FF",
        c400="#78A9FF",
        c50="#F9F9FB",
        c500="#4589FF",
        c600="#0F62FE",
        c700="#0043CE",
        c800="#002D9C",
        c900="#001D6C",
        c950="#001141",
    ),
    # IBM Cool Gray ramp.
    neutral_hue=gr.themes.Color(
        c100="#F2F4F8",
        c200="#DDE1E6",
        c300="#C1C7CD",
        c400="#A2A9B0",
        c50="#F9F9FB",
        c500="#878D96",
        c600="#697077",
        c700="#4D5358",
        c800="#393939",
        c900="#21272A",
        c950="#121619",
    ),
    spacing_size=sizes.spacing_md,  # change spacing to default size
    radius_size=sizes.radius_md,  # change spacing to default size and Keep Radius to make demo feel more playful
    text_size=sizes.text_lg,  # change fontsize to default size
    # spacing_size: sizes.Size | str = sizes.spacing_md, #change spacing to default size
    # radius_size: sizes.Size | str = sizes.radius_md, #change spacing to default size and Keep Radius to make
    # demo feel more playful
    # text_size: sizes.Size | str = sizes.text_lg, #change fontsize to default size
    font=["IBM Plex Sans", "ui-sans-serif", "system-ui", "sans-serif"],  # update font
    font_mono=["IBM Plex Mono", "ui-monospace", "Consolas", "monospace"],  # update font
).set(
    # Colors
    background_fill_primary="*neutral_100",  # Coolgray10 background
    background_fill_primary_dark="*neutral_950",  # Coolgray95 background for dark mode
    slider_color="*primary_600",  # Blue60
    slider_color_dark="*primary_500",  # Blue50
    # Shadows
    shadow_drop="0 1px 4px 0 rgb(0 0 0 / 0.1)",
    shadow_drop_lg="0 2px 5px 0 rgb(0 0 0 / 0.1)",
    # Block Labels
    block_background_fill="white",
    block_label_background_fill="white",  # same color as blockback gound fill
    block_label_radius="*radius_md",
    block_label_text_size="*text_md",
    block_label_text_weight="600",
    block_label_text_color="black",
    block_label_text_color_dark="white",
    block_title_radius="*block_label_radius",
    block_title_background_fill="*block_label_background_fill",
    block_title_text_weight="600",
    block_title_text_color="black",
    block_title_text_color_dark="white",
    block_label_margin="*spacing_md",
    # Inputs
    input_background_fill="white",
    input_background_fill_dark="*block-background-fill",
    input_border_color="*neutral_100",
    input_shadow="*shadow_drop",
    input_shadow_focus="*shadow_drop_lg",
    checkbox_shadow="none",
    # Buttons
    shadow_spread="6px",
    button_primary_shadow="*shadow_drop_lg",
    button_primary_shadow_hover="*shadow_drop_lg",
    button_primary_shadow_active="*shadow_inset",
    button_secondary_shadow="*shadow_drop_lg",
    button_secondary_shadow_hover="*shadow_drop_lg",
    button_secondary_shadow_active="*shadow_inset",
    checkbox_label_shadow="*shadow_drop_lg",
    button_primary_background_fill="*primary_600",
    button_primary_background_fill_hover="*primary_500",
    button_primary_background_fill_hover_dark="*primary_500",
    button_primary_text_color="white",
    button_secondary_background_fill="white",
    button_secondary_background_fill_hover="*neutral_100",
    button_secondary_background_fill_dark="*neutral_800",  # Secondary cool gray 80
    button_secondary_background_fill_hover_dark="*primary_500",
    button_secondary_text_color="*neutral_800",
    button_cancel_background_fill="*button_secondary_background_fill",
    button_cancel_background_fill_hover="*button_secondary_background_fill_hover",
    button_cancel_background_fill_hover_dark="*button_secondary_background_fill_hover",
    button_cancel_text_color="*button_secondary_text_color",
    checkbox_label_background_fill_selected="*primary_200",
    checkbox_label_background_fill_selected_dark="*primary_500",
    checkbox_border_width="1px",
    checkbox_border_color="*neutral_200",
    checkbox_background_color_dark="*neutral_700",  # Jan 18 test to fix checkbox, radio button background color
    checkbox_background_color_selected="*primary_600",
    checkbox_background_color_selected_dark="*primary_500",
    checkbox_border_color_focus="*primary_600",
    checkbox_border_color_focus_dark="*primary_500",
    checkbox_border_color_selected="*primary_600",
    checkbox_border_color_selected_dark="*primary_500",
    checkbox_label_text_color_selected="black",
    # Borders
    block_border_width="1px",  # test example border
    panel_border_width="1px",
    # Chatbubble related colors
    # light
    # color_accent = "*secondary_400",
    border_color_accent_subdued="*color_accent_soft",  # chatbubble human border color, use Blue 20 as an accent color
    color_accent_soft="*secondary_200",  # chatbubble human color
    # darkmode
    # chatbubble human border color in darkmode, use Blue 20 as an accent color
    border_color_accent_subdued_dark="*secondary_500",
    color_accent_soft_dark="*secondary_500",  # chatbubble human color in dark mode
    # Chatbot related font
    chatbot_text_size="*text_md",  # make it larger
    # additional dark mode related tweaks:
    # block_background_fill_dark="*neutral_950", # Jan 18 test coolgray95 background for dark mode
    block_label_background_fill_dark="*neutral_800",  # same color as blockback gound fill
    block_title_background_fill_dark="*block_label_background_fill",
    # input_background_fill_dark="*neutral_800", #This attribute help match fill color cool gray 80 to match background
    # however cause the problem for the general theme.
    # input_shadow_dark="*shadow_drop", #Test if it could make the border without the color
    # input_border_color_dark="*neutral_200",#add attribute for border Jan 18
    checkbox_border_color_dark="*neutral_600",  # Jan 18 test to fix border
)
src/themes/research_monochrome.py ADDED
@@ -0,0 +1,152 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """IBM Research Monochrome theme for gradio demos.
2
+
3
+ This version is a variation of CarbonSoft style, where the primary button is dark gray to create monochrome style. This
4
+ version uses the style from Research demos such as Bee to make it more playful with rounded corners, a larger font
5
+ family to enhance readability, and the IBM Cool Gray color palette for better consistency with other IBM Research demos,
6
+ such as Bee.
7
+ """
8
+
9
+ import gradio as gr
10
+ from gradio.themes.utils import sizes
11
+
12
# Monochrome variant of the Carbon theme: same IBM Blue / Cool Gray palettes
# and Plex fonts, but primary buttons and the slider use dark gray instead of
# blue for a monochrome look.
theme = gr.themes.Base(
    # IBM Blue ramp (Blue 10..100) for both primary and secondary hues.
    primary_hue=gr.themes.Color(
        c100="#EDF5FF",
        c200="#D0E2FF",
        c300="#A6C8FF",
        c400="#78A9FF",
        c50="#F9F9FB",
        c500="#4589FF",
        c600="#0F62FE",
        c700="#0043CE",
        c800="#002D9C",
        c900="#001D6C",
        c950="#001141",
    ),
    secondary_hue=gr.themes.Color(
        c100="#EDF5FF",
        c200="#D0E2FF",
        c300="#A6C8FF",
        c400="#78A9FF",
        c50="#F9F9FB",
        c500="#4589FF",
        c600="#0F62FE",
        c700="#0043CE",
        c800="#002D9C",
        c900="#001D6C",
        c950="#001141",
    ),
    # IBM Cool Gray ramp.
    neutral_hue=gr.themes.Color(
        c100="#F2F4F8",
        c200="#DDE1E6",
        c300="#C1C7CD",
        c400="#A2A9B0",
        c50="#F9F9FB",
        c500="#878D96",
        c600="#697077",
        c700="#4D5358",
        c800="#393939",
        c900="#21272A",
        c950="#121619",
    ),
    spacing_size=sizes.spacing_md,  # change spacing to default size
    radius_size=sizes.radius_md,  # change spacing to default size and Keep Radius to make demo feel more playful
    text_size=sizes.text_md,  # change fontsize to default size
    # spacing_size: sizes.Size | str = sizes.spacing_md, #change spacing to default size
    # radius_size: sizes.Size | str = sizes.radius_md, #change spacing to default size and Keep Radius to make
    # demo feel more playful
    # text_size: sizes.Size | str = sizes.text_lg, #change fontsize to default size
    font=["IBM Plex Sans", "ui-sans-serif", "system-ui", "sans-serif"],  # update font
    font_mono=["IBM Plex Mono", "ui-monospace", "Consolas", "monospace"],  # update font
).set(
    # Colors
    background_fill_primary="*neutral_100",  # Coolgray10 background
    background_fill_primary_dark="*neutral_950",  # Coolgray95 background for dark mode
    # Change blue to black to create monochrome style
    slider_color="*neutral_900",
    slider_color_dark="*primary_500",
    # Shadows
    shadow_drop="0 1px 4px 0 rgb(0 0 0 / 0.1)",
    shadow_drop_lg="0 2px 5px 0 rgb(0 0 0 / 0.1)",
    # Block Labels
    block_background_fill="white",
    block_label_background_fill="white",  # same color as blockback gound fill
    block_label_radius="*radius_md",
    block_label_text_size="*text_md",
    block_label_text_weight="600",
    block_label_text_color="black",
    block_label_text_color_dark="white",
    block_title_radius="*block_label_radius",
    block_title_background_fill="*block_label_background_fill",
    block_title_text_weight="400",
    block_title_text_color="black",
    block_title_text_color_dark="white",
    block_label_margin="*spacing_md",
    # Inputs
    input_background_fill="white",
    input_background_fill_dark="*block-background-fill",
    input_border_color="*neutral_100",
    input_shadow="*shadow_drop",
    input_shadow_dark="0 1px 4px #000",
    input_shadow_focus="*shadow_drop_lg",
    checkbox_shadow="none",
    # Buttons
    shadow_spread="6px",
    button_primary_shadow="*shadow_drop_lg",
    button_primary_shadow_hover="*shadow_drop_lg",
    button_primary_shadow_active="*shadow_inset",
    button_secondary_shadow="*shadow_drop_lg",
    button_secondary_shadow_hover="*shadow_drop_lg",
    button_secondary_shadow_active="*shadow_inset",
    checkbox_label_shadow="*shadow_drop_lg",
    # Change blue to black to create monochrome style
    button_primary_background_fill="*neutral_900",
    button_primary_background_fill_dark="*neutral_600",
    button_primary_background_fill_hover="*neutral_700",
    button_primary_background_fill_hover_dark="*primary_500",  # hover to be blue
    button_primary_text_color="white",
    button_secondary_background_fill="white",
    button_secondary_background_fill_hover="*neutral_100",
    button_secondary_background_fill_dark="*neutral_800",  # Secondary cool gray 80
    button_secondary_background_fill_hover_dark="*primary_500",
    button_secondary_text_color="*neutral_800",
    button_cancel_background_fill="*button_secondary_background_fill",
    button_cancel_background_fill_hover="*button_secondary_background_fill_hover",
    button_cancel_background_fill_hover_dark="*button_secondary_background_fill_hover",
    button_cancel_text_color="*button_secondary_text_color",
    checkbox_label_background_fill_selected="*primary_200",
    checkbox_label_background_fill_selected_dark="*primary_500",
    checkbox_border_width="1px",
    checkbox_border_color="*neutral_200",
    checkbox_background_color_dark="*neutral_700",  # Jan 18 test to fix checkbox, radio button background color
    checkbox_background_color_selected="*primary_600",
    checkbox_background_color_selected_dark="*primary_500",
    checkbox_border_color_focus="*primary_600",
    checkbox_border_color_focus_dark="*primary_500",
    checkbox_border_color_selected="*primary_600",
    checkbox_border_color_selected_dark="*primary_500",
    checkbox_label_text_color_selected="black",
    # Borders
    block_border_width="1px",  # test example border
    panel_border_width="1px",
    # Chatbubble related colors
    # light
    # color_accent = "*secondary_400",
    border_color_accent_subdued="*color_accent_soft",  # chatbubble human border color, use Blue 20 as an accent color
    color_accent_soft="*secondary_200",  # chatbubble human color
    # darkmode
    # chatbubble human border color in darkmode, use Blue 20 as an accent color
    border_color_accent_subdued_dark="*secondary_500",
    color_accent_soft_dark="*secondary_500",  # chatbubble human color in dark mode
    # Chatbot related font
    chatbot_text_size="*text_md",  # make it larger
    # additional dark mode related tweaks:
    # block_background_fill_dark="*neutral_950", # Jan 18 test coolgray95 background for dark mode
    block_label_background_fill_dark="*neutral_800",  # same color as blockback gound fill
    block_title_background_fill_dark="*block_label_background_fill",
    # input_background_fill_dark="*neutral_800", #This attribute help match fill color cool gray 80 to match background
    # however cause the problem for the general theme.
    # input_shadow_dark="*shadow_drop", #Test if it could make the border without the color
    # input_border_color_dark="*neutral_200",#add attribute for border Jan 18
    checkbox_border_color_dark="*neutral_600",  # Jan 18 test to fix border
)