ZennyKenny committed on
Commit
3fa52bd
·
verified ·
1 Parent(s): fd11c5a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -2
app.py CHANGED
@@ -2,13 +2,12 @@ import gradio as gr
2
  from transformers import TrOCRProcessor, VisionEncoderDecoderModel
3
  from PIL import Image
4
  import torch
5
- import spaces
6
 
7
  # Load TrOCR model
8
  processor = TrOCRProcessor.from_pretrained("microsoft/trocr-large-handwritten")
9
  model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-large-handwritten")
10
 
11
- @spaces.GPU
12
  def recognize_text(image):
13
  try:
14
  # Convert image to RGB if it's not already
@@ -19,6 +18,11 @@ def recognize_text(image):
19
  pixel_values = processor(images=image, return_tensors="pt").pixel_values
20
  print("Image preprocessed. Pixel values shape:", pixel_values.shape)
21
 
 
 
 
 
 
22
  # Generate text from the image
23
  with torch.no_grad(): # Disable gradient calculation for inference
24
  generated_ids = model.generate(pixel_values)
 
2
  from transformers import TrOCRProcessor, VisionEncoderDecoderModel
3
  from PIL import Image
4
  import torch
5
+ import matplotlib.pyplot as plt
6
 
7
  # Load TrOCR model
8
  processor = TrOCRProcessor.from_pretrained("microsoft/trocr-large-handwritten")
9
  model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-large-handwritten")
10
 
 
11
  def recognize_text(image):
12
  try:
13
  # Convert image to RGB if it's not already
 
18
  pixel_values = processor(images=image, return_tensors="pt").pixel_values
19
  print("Image preprocessed. Pixel values shape:", pixel_values.shape)
20
 
21
+ # Visualize preprocessed image
22
+ plt.imshow(pixel_values.squeeze().permute(1, 2, 0))
23
+ plt.title("Preprocessed Image")
24
+ plt.show()
25
+
26
  # Generate text from the image
27
  with torch.no_grad(): # Disable gradient calculation for inference
28
  generated_ids = model.generate(pixel_values)