Add the Gradio script and dependencies
- .env +2 -0
- Dockerfile +8 -0
- app.py +11 -6
- database.py +18 -16
- docker-compose.yml +6 -0
.env
ADDED
@@ -0,0 +1,2 @@
+QDRANT_HOST=localhost
+QDRANT_PORT=6333
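
Note: app.py and database.py read these values with os.getenv, which only sees real environment variables. docker-compose picks the .env file up on its own, but a bare `python app.py` on the host will not. A minimal sketch of loading the file explicitly, assuming the python-dotenv package is installed (it is not among this commit's dependencies):

# Minimal sketch, assuming python-dotenv (pip install python-dotenv);
# os.getenv alone does not parse .env files.
import os

from dotenv import load_dotenv

load_dotenv()  # reads .env from the current directory, if present

QDRANT_HOST = os.getenv("QDRANT_HOST", "localhost")
QDRANT_PORT = int(os.getenv("QDRANT_PORT", 6333))
print(f"Connecting to Qdrant at {QDRANT_HOST}:{QDRANT_PORT}")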
Dockerfile
ADDED
@@ -0,0 +1,8 @@
+# Use a base image for Qdrant
+FROM qdrant/qdrant
+
+# Expose Qdrant's default port
+EXPOSE 6333
+
+# Command to start Qdrant
+CMD ["qdrant"]
app.py
CHANGED
@@ -1,18 +1,23 @@
 import gradio as gr
 import laion_clap
 from qdrant_client import QdrantClient
+import os
 
-#
-
+# Use environment variables for configuration
+QDRANT_HOST = os.getenv('QDRANT_HOST', 'localhost')
+QDRANT_PORT = int(os.getenv('QDRANT_PORT', 6333))
+
+# Connect to Qdrant
+client = QdrantClient(QDRANT_HOST, port=QDRANT_PORT)
 print("[INFO] Client created...")
 
-#
+# Load the model
 print("[INFO] Loading the model...")
 model_name = "laion/larger_clap_music"
 model = laion_clap.CLAP_Module(enable_fusion=False)
-model.load_ckpt() #
+model.load_ckpt()  # download the default pretrained checkpoint
 
-#
+# Gradio interface
 max_results = 10
 
 def sound_search(query):
@@ -34,7 +39,7 @@ with gr.Blocks() as demo:
         """# Sound search database """
     )
     inp = gr.Textbox(placeholder="What sound are you looking for ?")
-    out = [gr.Audio(label=f"{x}") for x in range(max_results)] #
+    out = [gr.Audio(label=f"{x}") for x in range(max_results)]  # Needed to get distinct output objects
     inp.change(sound_search, inp, out)
 
 demo.launch()
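
The hunks above elide the body of sound_search (new lines 24-38). For context, a hypothetical sketch of what such a handler typically looks like with CLAP text embeddings and Qdrant; the collection name "audio" and the "audio_path" payload key are assumptions, not taken from this commit:

# Hypothetical sketch of the elided sound_search body.
def sound_search(query):
    # CLAP's text tower expects a batch; a dummy second entry avoids
    # single-item batch issues, a common laion_clap idiom.
    text_embed = model.get_text_embedding([query, ""], use_tensor=False)[0]
    hits = client.search(
        collection_name="audio",           # assumed collection name
        query_vector=text_embed.tolist(),
        limit=max_results,
    )
    paths = [hit.payload["audio_path"] for hit in hits]  # assumed payload key
    # Pad to max_results so every gr.Audio output receives a value.
    return paths + [None] * (max_results - len(paths))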
database.py
CHANGED
@@ -8,8 +8,11 @@ from qdrant_client import QdrantClient
 from qdrant_client.http import models
 from tqdm import tqdm
 
+# Use environment variables for configuration
+QDRANT_HOST = os.getenv('QDRANT_HOST', 'localhost')
+QDRANT_PORT = int(os.getenv('QDRANT_PORT', 6333))
 
-# Functions utils
+# Functions utils
 def get_md5(fpath):
     with open(fpath, "rb") as f:
         file_hash = hashlib.md5()
@@ -17,52 +20,51 @@ def get_md5(fpath):
         file_hash.update(chunk)
     return file_hash.hexdigest()
 
-
-# PARAMETERS #######################################################################################
+# PARAMETERS
 CACHE_FOLDER = '/home/nahia/data/audio/'
 KAGGLE_TRAIN_PATH = '/home/nahia/Documents/audio/actor/Actor_01/'
 
-#
+# Load the CLAP model
 print("[INFO] Loading the model...")
 model_name = 'music_speech_epoch_15_esc_89.25.pt'
 model = laion_clap.CLAP_Module(enable_fusion=False)
-model.load_ckpt() #
+model.load_ckpt()  # download the default pretrained checkpoint
 
-#
+# Initialize the cache
 os.makedirs(CACHE_FOLDER, exist_ok=True)
 cache = Cache(CACHE_FOLDER)
 
-#
+# Embed the audio files
 audio_files = [p for p in glob(os.path.join(KAGGLE_TRAIN_PATH, '*.wav'))]
 audio_embeddings = []
 chunk_size = 100
 total_chunks = int(len(audio_files) / chunk_size)
 
-#
+# Use tqdm for a progress bar
 for i in tqdm(range(0, len(audio_files), chunk_size), total=total_chunks):
-    chunk = audio_files[i:i + chunk_size] #
+    chunk = audio_files[i:i + chunk_size]  # Get a chunk of audio files
     chunk_embeddings = []
 
     for audio_file in chunk:
-        #
+        # Compute a unique hash for the audio file
         file_key = get_md5(audio_file)
 
         if file_key in cache:
-            #
+            # If this file's embedding is cached, retrieve it
            embedding = cache[file_key]
         else:
-            #
+            # Otherwise, compute the embedding and cache it
             embedding = model.get_audio_embedding_from_filelist(x=[audio_file], use_tensor=False)[
-                0] #
+                0]  # Assume the model returns a list
             cache[file_key] = embedding
         chunk_embeddings.append(embedding)
     audio_embeddings.extend(chunk_embeddings)
 
-#
+# Close the cache when done
 cache.close()
 
-#
-client = QdrantClient(
+# Create a qdrant collection
+client = QdrantClient(QDRANT_HOST, port=QDRANT_PORT)
 print("[INFO] Client created...")
 
 print("[INFO] Creating qdrant data collection...")
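
The diff is truncated after the last print; what typically follows is the collection creation and point upsert. A sketch of that continuation under stated assumptions (collection "audio", 512-dimensional CLAP vectors, cosine distance, an "audio_path" payload key matching the search side), not the commit's actual code:

# Hypothetical continuation of database.py (the diff is truncated here).
client.recreate_collection(
    collection_name="audio",  # assumed collection name
    vectors_config=models.VectorParams(size=512, distance=models.Distance.COSINE),
)

client.upsert(
    collection_name="audio",
    points=[
        models.PointStruct(
            id=idx,
            vector=embedding.tolist(),
            payload={"audio_path": path},  # assumed payload key
        )
        for idx, (path, embedding) in enumerate(zip(audio_files, audio_embeddings))
    ],
)
print("[INFO] Points upserted...")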
docker-compose.yml
ADDED
@@ -0,0 +1,6 @@
+version: '3.8'
+services:
+  qdrant:
+    build: .
+    ports:
+      - "6333:6333"
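
Since the compose service just wraps the stock qdrant/qdrant image, a quick way to verify the stack after `docker compose up -d` is to connect from the host. A minimal check, assuming the port mapping above:

# Connectivity check from the host (a sketch; assumes Qdrant is reachable
# on localhost:6333 as mapped in docker-compose.yml).
import os

from qdrant_client import QdrantClient

client = QdrantClient(os.getenv("QDRANT_HOST", "localhost"),
                      port=int(os.getenv("QDRANT_PORT", 6333)))
print(client.get_collections())  # empty collection list on a fresh instance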