First, a quick code example of K-Means in Scikit-learn
from sklearn.datasets import make_blobs
from sklearn.cluster import KMeans
# Number of blob centers (clusters) to generate.
n_centers = 5
# make_blobs takes the number of centers through its `centers` keyword;
# it has no `n_centers` parameter, so passing one raises TypeError.
# The second return value (per-sample labels) is intentionally discarded.
X, _ = make_blobs(n_samples=10000, centers=n_centers)
# Download the Dremio ODBC driver RPM (version 1.4.2.1003).
wget https://download.dremio.com/odbc-driver/1.4.2.1003/dremio-odbc-1.4.2.1003-1.x86_64.rpm
# Install alien (package-format converter) and the unixODBC development files.
sudo apt-get install alien unixodbc-dev -y
# Convert the downloaded RPM into a .deb package.
sudo alien dremio-odbc-1.4.2.1003-1.x86_64.rpm
# Install the converted package (note the release is -2 in the .deb filename).
sudo dpkg -i dremio-odbc_1.4.2.1003-2_amd64.deb
# Standard library
import os
import time
from collections import namedtuple

# Third-party
import orjson
import psutil
import pyarrow as pa
import vaex
from pyarrow import flight
# Standard library
import os
import time
from collections import namedtuple

# Third-party
import orjson
import psutil
import pyarrow as pa
import vaex
from pyarrow import flight