HenriqueBraz committed on
Commit
9633d44
·
verified ·
1 Parent(s): 4d36e6a

Update core/pre_processing.py

Browse files
Files changed (1) hide show
  1. core/pre_processing.py +13 -0
core/pre_processing.py CHANGED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import re
2
+ from PIL import Image
3
+
4
def clean_text(text):
    """Strip HTML tags and special characters from *text*.

    Tags are deleted without inserting a space, so words separated only by
    a tag are joined ("a<br>b" becomes "ab").  After tag removal, only ASCII
    letters, digits, whitespace and Latin-1 accented letters are kept.

    Args:
        text: The string to clean.

    Returns:
        The cleaned string with leading and trailing whitespace removed.
    """
    # Drop anything that looks like an HTML/XML tag: "<" ... ">".
    without_tags = re.sub(r"<[^>]+>", "", text)
    # Keep letters, digits and whitespace only.  The accented range is split
    # around U+00D7 (multiplication sign) and U+00F7 (division sign): both sit
    # inside the plain "À-ÿ" span but are symbols, not letters.
    letters_only = re.sub(r"[^a-zA-ZÀ-ÖØ-öø-ÿ0-9\s]", "", without_tags)
    return letters_only.strip()
8
+
9
def resize_image(image, size=(224, 224)):
    """Return the result of resizing *image* to *size*.

    Args:
        image: Any object exposing a ``resize(size)`` method.
            NOTE(review): presumably a ``PIL.Image.Image`` given the
            file-level import -- confirm against callers.
        size: Target size forwarded unchanged to ``image.resize``; defaults
            to ``(224, 224)``.  For PIL images this would be
            ``(width, height)`` -- TODO confirm.

    Returns:
        Whatever ``image.resize(size)`` returns.
    """
    resized = image.resize(size)
    return resized
11
+
12
def normalize_audio(audio_array):
    """Scale *audio_array* so that its largest absolute sample becomes 1.

    Args:
        audio_array: An array-like supporting ``abs()`` and true division
            by a scalar.  NOTE(review): presumably a NumPy array of audio
            samples -- confirm against callers.

    Returns:
        ``audio_array`` divided by its peak absolute value.  When the input
        is all zeros (silence) or empty, there is no peak to scale by, so
        the values are returned unscaled (divided by 1) instead of
        producing NaN/inf or raising.
    """
    magnitudes = abs(audio_array)
    if hasattr(magnitudes, "max"):
        # Use the array's own reduction: it collapses every axis, whereas the
        # built-in max() iterates rows of a multi-dimensional array.
        # Zero-size arrays have no maximum, so treat them as peak 0.
        is_empty = getattr(magnitudes, "size", None) == 0
        peak = 0 if is_empty else magnitudes.max()
    else:
        peak = max(magnitudes, default=0)
    if peak == 0:
        # Avoid dividing by zero for silent or empty input.
        peak = 1
    return audio_array / peak