broadwell committed
Commit c3d8208
1 Parent(s): 3d8e28d

Don't run activations viz with ResNet model, to save memory

Files changed (1): app.py (+20 -7)
app.py CHANGED
@@ -27,7 +27,7 @@ from CLIP_Explainability.vit_cam import (
 
 from pytorch_grad_cam.grad_cam import GradCAM
 
-RUN_LITE = False  # Load vision model for CAM viz explainability for M-CLIP only
+RUN_LITE = True  # Load models for CAM viz for M-CLIP and J-CLIP only
 
 MAX_IMG_WIDTH = 500
 MAX_IMG_HEIGHT = 800
@@ -110,6 +110,10 @@ def clip_search(search_query):
 
 
 def string_search():
+    st.session_state.disable_uploader = (
+        RUN_LITE and st.session_state.active_model == "Legacy (multilingual ResNet)"
+    )
+
     if "search_field_value" in st.session_state:
         clip_search(st.session_state.search_field_value)
 
@@ -179,10 +183,9 @@ def init():
     ja_model_name = "hakuhodo-tech/japanese-clip-vit-h-14-bert-wider"
     ja_model_path = "./models/ViT-H-14-laion2B-s32B-b79K.bin"
 
-    if not RUN_LITE:
-        st.session_state.ja_image_model, st.session_state.ja_image_preprocess = (
-            load(ja_model_path, device=device, jit=False)
-        )
+    st.session_state.ja_image_model, st.session_state.ja_image_preprocess = load(
+        ja_model_path, device=device, jit=False
+    )
 
     st.session_state.ja_model = AutoModel.from_pretrained(
         ja_model_name, trust_remote_code=True
@@ -216,6 +219,9 @@ def init():
     st.session_state.search_image_ids = []
     st.session_state.search_image_scores = {}
     st.session_state.text_table_df = None
+    st.session_state.disable_uploader = (
+        RUN_LITE and st.session_state.active_model == "Legacy (multilingual ResNet)"
+    )
 
     with st.spinner("Loading models and data, please wait..."):
         load_image_features()
@@ -430,7 +436,7 @@ def visualize_gradcam(image):
 
     header_cols = st.columns([80, 20], vertical_alignment="bottom")
     with header_cols[0]:
-        st.title("Image + query details")
+        st.title("Image + query activation gradients")
     with header_cols[1]:
         if st.button("Close"):
            st.rerun()
@@ -457,6 +463,8 @@ def visualize_gradcam(image):
         st.session_state.search_field_value
     )
 
+    st.image(image)
+
     with st.spinner("Calculating..."):
         # info_text = st.text("Calculating activation regions...")
 
@@ -743,6 +751,7 @@ with controls[3]:
         key="uploaded_image",
         label_visibility="collapsed",
         on_change=vis_uploaded_image,
+        disabled=st.session_state.disable_uploader,
    )
 
 
@@ -777,7 +786,9 @@ for image_id in batch:
         <div>""",
         unsafe_allow_html=True,
     )
-    if not RUN_LITE or st.session_state.active_model == "M-CLIP (multilingual ViT)":
+    if not (
+        RUN_LITE and st.session_state.active_model == "Legacy (multilingual ResNet)"
+    ):
         st.button(
             "Explain this",
             on_click=vis_known_image,
@@ -785,4 +796,6 @@ for image_id in batch:
             use_container_width=True,
             key=image_id,
         )
+    else:
+        st.empty()
     col = (col + 1) % row_size
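
Taken together, the diff stops skipping the J-CLIP vision model load under RUN_LITE and instead gates the memory-heavy activation visualizations on the currently selected model: when lite mode is on and the legacy multilingual ResNet model is active, the image uploader is disabled and the per-result "Explain this" buttons are not rendered. Below is a minimal, self-contained sketch of that gating pattern. It is not code from app.py: the viz_disabled helper and the "J-CLIP (Japanese ViT)" label are illustrative placeholders; only the two model labels quoted in the diff and the Streamlit calls (st.file_uploader's disabled argument, st.button, st.empty) are taken from the change.

import streamlit as st

RUN_LITE = True  # same flag flipped in this commit

LEGACY_MODEL = "Legacy (multilingual ResNet)"  # label quoted in the diff


def viz_disabled(active_model: str) -> bool:
    # Hypothetical helper: CAM visualization is unavailable only when running
    # in lite mode with the legacy ResNet model selected.
    return RUN_LITE and active_model == LEGACY_MODEL


active_model = st.selectbox(
    "Model",
    # "J-CLIP (Japanese ViT)" is a placeholder; the other two labels appear in the diff.
    ["M-CLIP (multilingual ViT)", "J-CLIP (Japanese ViT)", LEGACY_MODEL],
)

# The uploader stays visible but is disabled, mirroring the
# disabled=st.session_state.disable_uploader argument added to st.file_uploader.
st.file_uploader("Search by image", disabled=viz_disabled(active_model))

# "Explain this" is rendered only when visualization is available; otherwise an
# empty placeholder is emitted, as in the diff's else branch.
if not viz_disabled(active_model):
    st.button("Explain this")
else:
    st.empty()

As the commit message indicates, the memory saving comes from never running the activation visualizations against the ResNet model, not from skipping model loads, which is why the J-CLIP vision model load becomes unconditional.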