%%pyspark
spark #spark session
spark.sql #SQL Context
spark.catalog # Hive Context
PySpark is the Python library for Spark programming. It allows you to use the powerful and efficient data processing capabilities of Apache Spark from within the Python programming language. PySpark provides a high-level API for distributed data processing that can be used to perform common data analysis tasks, such as filtering, aggregation, and transformation of large datasets.
Pandas is a Python library for data manipulation and analysis. It provides powerful data structures, such as the DataFrame and Series, that are designed to make it easy to work with structured data in Python. With pandas, you can perform a wide range of data analysis tasks, such as filtering, aggregation, and transformation of data, as well as data cleaning and preparation.
PySpark | Pandas |
---|
^(?:(?:31(\/|-|\.)(?:0?[13578]|1[02]|(?:Jan|Mar|May|Jul|Aug|Oct|Dec)))\1|(?:(?:29|30)(\/|-|\.)(?:0?[1,3-9]|1[0-2]|(?:Jan|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec))\2))(?:(?:1[6-9]|[2-9]\d)?\d{2})$|^(?:29(\/|-|\.)(?:0?2|(?:Feb))\3(?:(?:(?:1[6-9]|[2-9]\d)?(?:0[48]|[2468][048]|[13579][26])|(?:(?:16|[2468][048]|[3579][26])00))))$|^(?:0?[1-9]|1\d|2[0-8])(\/|-|\.)(?:(?:0?[1-9]|(?:Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep))|(?:1[0-2]|(?:Oct|Nov|Dec)))\4(?:(?:1[6-9]|[2-9]\d)?\d{2})$
import glob | |
import os | |
import time | |
dir_name = '/content/drive/MyDrive/' | |
target_date = datetime.datetime.strptime('2023-03-30', '%Y-%m-%d').date() | |
print(target_date) | |
# Get list of all files only in the given directory |
import io | |
import requests; | |
import pathlib; | |
from PIL import Image | |
# =================================================================== # | |
def download_image(url): | |
filename = url.split('/')[-1]; | |
print(f"Filename : {filename}") |
#!/bin/bash | |
# https://gist.github.com/princeppy/dd3ca67e3233589aa7ab102568806f4b | |
# https://mathiasbynens.be/notes/shell-script-mac-apps | |
if [ "$1" = "-h" -o "$1" = "--help" -o -z "$1" ]; then cat <<EOF | |
appify v3.0.1 for Mac OS X - http://mths.be/appify | |
Creates the simplest possible Mac app from a shell script. | |
Appify takes a shell script as its first argument: |
<?php | |
/** | |
* Programmatically install and activate wordpress plugins | |
* | |
* Usage: | |
* 1. Edit the $pluginSlugs array at the beginning of this file to include the slugs of all the | |
* plugins you want to install and activate | |
* 2. Upload this file to the wordpress root directory (the same directory that contains the | |
* 'wp-admin' directory). | |
* 3. Navigate to <your-domain-wordpress-root>/install-wp-plugins.php (If wordpress is installed |
CREATE FUNCTION [dbo].[SplitCSV] | |
(@CSV VARCHAR (MAX)) | |
RETURNS @OutTable TABLE ([ID] VARCHAR (255) NOT NULL) | |
AS BEGIN | |
--hold the current cursor position | |
declare @currentposition int | |
--hold the next position index of the cursor. | |
declare @nextposition int |
type Omit<T, K extends keyof T> = Pick<T, Exclude<keyof T, K>>; | |
export function withAppContext< | |
P extends { appContext?: AppContextInterface }, | |
R = Omit<P, 'appContext'> | |
>( | |
Component: React.ComponentClass<P> | React.StatelessComponent<P> | |
): React.SFC<R> { | |
return function BoundComponent(props: R) { | |
return ( |