Spaces:

sk2003
/

InteriorVision

Sleeping

App Files Community

sk2003 committed on Aug 29

Commit

0747848

•

1 Parent(s): 73142ed

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -11

app.py CHANGED Viewed

@@ -6,30 +6,33 @@ from PIL import Image
 from huggingface_hub import hf_hub_download
 import torch.nn as nn
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-# Finetuned Resnet-50 model is downloaded
 vgg16_model_path = hf_hub_download(repo_id="sk2003/style_recognizer_vgg", filename="vgg16_model.pth")
 vgg16 = models.vgg16(pretrained=True)
 for param in vgg16.parameters():
-    param.requires_grad = False # freezing parameters
 num_classes = 8
-vgg16.fc = nn.Linear(vgg16.fc.in_features, num_classes)
 vgg16 = vgg16.to(device)
-# Loading the model
 checkpoint = torch.load(vgg16_model_path, map_location=device)
 vgg16.load_state_dict(checkpoint['model_state_dict'])
-vgg16.eval() # setting to evaluation mode to disable batch-norm and dropout layers
-# Fine-tuned Stable Diffusion model
 model_id = "sk2003/room-styler"
 pipe = StableDiffusionPipeline.from_pretrained(model_id, torch_dtype=torch.float16)
 pipe.to(device)
-# Prediction function for the ResNet50 model
 def predict(image):
     transform = transforms.Compose([
         transforms.Resize((224, 224)),
@@ -39,7 +42,7 @@ def predict(image):
     image_tensor = transform(image).unsqueeze(0).to(device)
     with torch.no_grad():
-        outputs = resnet50(image_tensor)
         _, predicted = torch.max(outputs.data, 1)
     classes = ["Classic", "Modern", "Vintage", "Glamour", "Scandinavian", "Rustic", "ArtDeco", "Industrial"]
@@ -54,9 +57,9 @@ def generate_image(prompt):
 # Gradio interface
 with gr.Blocks() as demo:
-    gr.Markdown("## Room Style Recognition and Generation") # title
-   # 1st tab
     with gr.Tab("Recognize Room Style"):
         image_input = gr.Image(type="pil")
         label_output = gr.Textbox()
@@ -71,4 +74,3 @@ with gr.Blocks() as demo:
         btn_generate.click(generate_image, inputs=text_input, outputs=image_output)
 demo.launch()

 from huggingface_hub import hf_hub_download
 import torch.nn as nn
+# Set the device
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+# Download the fine-tuned VGG16 model
 vgg16_model_path = hf_hub_download(repo_id="sk2003/style_recognizer_vgg", filename="vgg16_model.pth")
+# Load the VGG16 model with pre-trained weights
 vgg16 = models.vgg16(pretrained=True)
 for param in vgg16.parameters():
+    param.requires_grad = False  # Freeze parameters
+# Update the last fully connected layer to match the number of classes
 num_classes = 8
+vgg16.classifier[6] = nn.Linear(vgg16.classifier[6].in_features, num_classes)
 vgg16 = vgg16.to(device)
+# Load the fine-tuned model state
 checkpoint = torch.load(vgg16_model_path, map_location=device)
 vgg16.load_state_dict(checkpoint['model_state_dict'])
+vgg16.eval()  # Set the model to evaluation mode
+# Load the fine-tuned Stable Diffusion model
 model_id = "sk2003/room-styler"
 pipe = StableDiffusionPipeline.from_pretrained(model_id, torch_dtype=torch.float16)
 pipe.to(device)
+# Prediction function for the VGG16 model
 def predict(image):
     transform = transforms.Compose([
         transforms.Resize((224, 224)),
     image_tensor = transform(image).unsqueeze(0).to(device)
     with torch.no_grad():
+        outputs = vgg16(image_tensor)
         _, predicted = torch.max(outputs.data, 1)
     classes = ["Classic", "Modern", "Vintage", "Glamour", "Scandinavian", "Rustic", "ArtDeco", "Industrial"]
 # Gradio interface
 with gr.Blocks() as demo:
+    gr.Markdown("## Room Style Recognition and Generation")  # Title
+    # 1st tab
     with gr.Tab("Recognize Room Style"):
         image_input = gr.Image(type="pil")
         label_output = gr.Textbox()
         btn_generate.click(generate_image, inputs=text_input, outputs=image_output)
 demo.launch()