You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
def__init__(self, dataset_path="movies_metadata.csv", sample_size=1000):
# Connect to Qdrant Cloudself.client=QdrantClient(
url=os.getenv("QDRANT_URL_LOCAL"),
timeout=300
)
self.model=SentenceTransformer('all-MiniLM-L6-v2', device='mps') # Adjust device if neededself.collection_name="movies_large"# Load and preprocess movie datasetself._load_dataset(dataset_path, sample_size)
self._initialize_collection()
def_load_dataset(self, dataset_path, sample_size=1000):
"""Load and sample movie data from CSV."""def_initialize_collection(self):
"""Create or reset the collection and upload data."""ifself.client.collection_exists(self.collection_name):
self.client.delete_collection(self.collection_name)
print(f"Collection '{self.collection_name}' deleted.")
self.client.create_collection(
collection_name=self.collection_name,
vectors_config=VectorParams(size=384, distance=Distance.COSINE),
optimizers_config=models.OptimizersConfigDiff(
indexing_threshold=0,
),
shard_number=2,
)
points= [
PointStruct(
id=idx,
vector=vector,
payload={"title": movie["title"], "description": movie["description"]}
)
foridx, (vector, movie) inenumerate(zip(self.vectors, self.movies))
]
self.client.upsert(
collection_name=self.collection_name,
points=points,
)
print(f"Collection '{self.collection_name}' initialized with {len(points)} points.")
When I uploaded 1,000 points, it worked fine. But with 10,000 points, it gets stuck and doesn’t send the data to the client. I checked the bulk upload documentation but didn’t find anything helpful. My device has plenty of free RAM, so I don’t think it’s a memory issue.
The text was updated successfully, but these errors were encountered:
When I uploaded 1,000 points, it worked fine. But with 10,000 points, it gets stuck and doesn’t send the data to the client. I checked the bulk upload documentation but didn’t find anything helpful. My device has plenty of free RAM, so I don’t think it’s a memory issue.
The text was updated successfully, but these errors were encountered: