blob: 4c44f5315b481ec6a646344ebe25c4593f33375e [file] [log] [blame]
Search.setIndex({"docnames": ["create", "data", "flight", "index", "io", "schema"], "filenames": ["create.rst", "data.rst", "flight.rst", "index.rst", "io.rst", "schema.rst"], "titles": ["Creating Arrow Objects", "Data Manipulation", "Arrow Flight", "Apache Arrow Python Cookbook", "Reading and Writing Data", "Working with Schema"], "terms": {"recip": [0, 1, 2, 3, 4, 5], "relat": [0, 1, 2, 4], "creation": [0, 5], "tensor": 0, "all": [0, 1, 2, 4, 5], "other": [0, 2], "entiti": [0, 4], "keep": [0, 4], "continu": 0, "optimis": 0, "memori": [0, 2, 3], "footprint": 0, "simd": 0, "analys": 0, "In": [0, 1, 2, 4], "python": [0, 2, 5], "": [0, 1, 2, 4, 5], "possibl": [0, 1, 4, 5], "build": [0, 2], "pyarrow": [0, 1, 2, 3, 4, 5], "start": [0, 2], "list": [0, 1, 2, 4], "sequenc": 0, "gener": [0, 2, 4], "numpi": [0, 4], "panda": [0, 2], "seri": 0, "import": [0, 1, 2, 4, 5], "pa": [0, 1, 2, 4, 5], "1": [0, 1, 2, 4, 5], "2": [0, 1, 2, 4, 5], "3": [0, 1, 2, 4, 5], "4": [0, 1, 2, 4, 5], "5": [0, 1, 2, 4, 5], "print": [0, 1, 2, 4, 5], "can": [0, 1, 2, 4, 5], "also": [0, 1, 2, 3, 4, 5], "provid": [0, 1, 2, 4, 5], "mask": [0, 3], "specifi": 0, "which": [0, 1, 2, 3, 4, 5], "valu": [0, 2, 3, 4], "should": [0, 2, 4], "consid": 0, "null": [0, 1], "np": [0, 4], "true": [0, 1, 2, 4], "fals": [0, 1, 2, 4], "when": [0, 1, 2, 3, 4, 5], "leverag": [0, 2, 4], "optim": [0, 4], "code": [0, 2, 4], "path": [0, 2, 4], "reli": [0, 4], "intern": [0, 2], "represent": 0, "pd": [0, 2], "array_from_numpi": 0, "arang": [0, 4], "array_from_panda": 0, "support": [0, 4], "tabular": 0, "each": [0, 1, 2, 4, 5], "column": [0, 2, 3, 4, 5], "i": [0, 1, 2, 3, 4, 5], "repres": [0, 4], "chunkedarrai": [0, 1, 4], "pair": [0, 1], "multipl": [0, 1, 3, 4], "name": [0, 1, 2, 4, 5], "b": [0, 1, 2, 4, 5], "c": [0, 1, 2, 4, 5], "d": [0, 1, 4, 5], "e": [0, 1, 2, 5], "0": [0, 1, 2, 3, 4, 5], "col1": [0, 4, 5], "col2": [0, 5], "col3": [0, 5], "int64": [0, 1, 4, 5], "string": [0, 1, 2, 5], "doubl": [0, 1, 5], "allow": [0, 2, 4], "fast": 0, "zero": [0, 1], "copi": [0, 1], "structur": [0, 2, 4], "The": [0, 1, 2, 3, 4, 5], "function": [0, 2, 3, 4, 5], "varieti": 0, "input": [0, 4], "includ": [0, 1, 2, 5], "dictionari": [0, 2], "pass": [0, 2, 4], "convers": 0, "benefit": 0, "behaviour": 0, "from_pylist": 0, "method": [0, 1, 2, 4], "row": [0, 1, 2, 4], "dict": [0, 2], "ar": [0, 1, 2, 4, 5], "infer": [0, 4, 5], "schema": [0, 2, 3, 4], "explicitli": 0, "most": [0, 1, 2, 4, 5], "o": 0, "oper": [0, 1, 2, 4], "happen": 0, "ship": 0, "destin": 0, "recordbatch": [0, 4], "wai": [0, 2], "A": [0, 1, 2, 5], "seen": 0, "slice": 0, "from_arrai": [0, 4], "7": [0, 1, 4], "9": [0, 1, 4], "6": [0, 1, 2, 4], "8": [0, 1, 2, 4], "10": [0, 1, 4], "odd": 0, "even": [0, 2], "combin": [0, 1, 2, 5], "us": [0, 2, 3, 4, 5], "from_batch": [0, 2], "second_batch": 0, "11": [0, 1, 4], "13": [0, 4], "15": [0, 1, 4], "17": [0, 4], "19": [0, 4], "12": [0, 1, 4], "14": [0, 1, 4], "16": [0, 3, 4], "18": [0, 4], "20": [0, 1, 4], "equal": [0, 1, 4], "convert": [0, 2, 4, 5], "to_batch": [0, 4], "record_batch": [0, 2, 4], "max_chunks": 0, "len": [0, 1, 2], "dictionaryarrai": 0, "without": [0, 2], "cost": [0, 1], "repeat": [0, 1], "categori": 0, "over": [0, 2], "thi": [0, 2, 3, 4, 5], "reduc": 0, "might": [0, 1, 2, 3, 4, 5], "have": [0, 1, 2, 4, 5], "larg": [0, 2], "text": 0, "If": [0, 1, 2, 4, 5], "you": [0, 1, 2, 4, 5], "an": [0, 2, 3, 4], "contain": [0, 4], "dictionary_encod": 0, "arr": [0, 1, 4, 5], "red": 0, "green": 0, "blue": 0, "indic": 0, "alreadi": [0, 5], "know": 0, "skip": 0, "encod": [0, 2], "step": [0, 2], "directli": [0, 4], "transform": 1, "see": [1, 2], "complet": [1, 4], "avail": [1, 2], "arrow": 1, "those": [1, 3, 4], "expos": [1, 2, 4], "through": [1, 2, 5], "modul": [1, 3, 4], "given": [1, 4], "100": [1, 4], "number": [1, 4], "from": [1, 2, 3], "99": [1, 4], "f": [1, 2, 4], "we": [1, 2, 4, 5], "pc": 1, "49": 1, "And": [1, 2], "min_max": 1, "time": [1, 2, 4], "nums_arr": 1, "entri": [1, 4], "value_count": 1, "common": [1, 2, 3, 4], "multipli": 1, "198": 1, "split": [1, 4], "across": [1, 2], "two": [1, 2], "differ": [1, 4, 5], "concaten": 1, "singl": [1, 2, 4, 5], "oscar": 1, "nomin": 1, "divid": 1, "between": [1, 2], "oscar_nominations_1": 1, "meryl": 1, "streep": 1, "katharin": 1, "hepburn": 1, "21": [1, 4], "actor": 1, "oscar_nominations_2": 1, "jack": 1, "nicholson": 1, "bett": 1, "davi": 1, "them": [1, 2, 4, 5], "concat_t": 1, "oscar_nomin": 1, "By": 1, "default": [1, 2, 4], "doesn": [1, 4], "t": [1, 2, 4], "need": [1, 2, 3, 4], "rewrit": 1, "As": [1, 2], "made": 1, "result": [1, 2, 4], "chunk": [1, 2, 4], "point": [1, 4], "origin": 1, "ha": [1, 2, 4, 5], "been": [1, 4], "under": 1, "some": [1, 2, 4], "condit": 1, "cast": [1, 5], "one": [1, 2, 4, 5], "type": [1, 2, 3, 4], "anoth": [1, 2], "promot": 1, "case": [1, 2, 4], "extra": 1, "occur": 1, "extend": [1, 2], "its": [1, 4, 5], "append_column": 1, "suppos": [1, 2], "actress": 1, "addit": [1, 2], "track": 1, "year": [1, 4], "wa": [1, 2, 5], "won": 1, "wonyear": 1, "1980": 1, "1983": 1, "2012": 1, "1934": 1, "1968": 1, "1969": 1, "1982": 1, "item": 1, "child": [1, 2], "set_column": 1, "inform": [1, 2], "about": [1, 2, 4], "sold": 1, "supermarket": 1, "particular": 1, "dai": [1, 4], "sales_data": 1, "potato": 1, "bean": 1, "cucumb": 1, "egg": 1, "30": 1, "amount": 1, "index": [1, 3], "updat": [1, 2, 4], "sale": 1, "new_sales_data": 1, "new_amount": 1, "40": 1, "kei": [1, 2, 4], "group_bi": 1, "follow": [1, 2, 4], "aggreg": 1, "tablegroupbi": 1, "learn": 1, "more": [1, 2], "groupbi": 1, "here": [1, 2], "For": [1, 2, 4, 5], "exampl": [1, 2, 3, 4, 5], "let": [1, 2, 4], "sai": 1, "set": [1, 2, 3, 4], "associ": 1, "want": [1, 2, 4, 5], "like": [1, 2, 4, 5], "sum": 1, "evalu": 1, "how": [1, 2, 3], "mani": [1, 3], "uniqu": 1, "now": [1, 2], "field": [1, 4, 5], "note": 1, "aggregated_t": 1, "values_sum": 1, "31": [1, 4], "observ": 1, "carefulli": 1, "new": [1, 2], "return": [1, 2, 4], "form": 1, "option": [1, 2, 4], "take": [1, 2], "where": [1, 2, 4], "our": [1, 2], "dataset": [1, 2, 3], "exclud": 1, "sampl": 1, "none": [1, 2, 4], "grouped_t": 1, "countopt": 1, "mode": [1, 4], "only_valid": 1, "values_count": 1, "discuss": 1, "base": 1, "either": [1, 4], "ascend": 1, "descend": 1, "prepar": 1, "123": 1, "Then": [1, 2, 4], "sort_bi": 1, "sorted_t": 1, "look": [1, 4], "sever": [1, 2], "find": 1, "onli": [1, 2, 4], "greater": 1, "than": 1, "could": [1, 2, 4], "get": [1, 2, 4], "back": [1, 2, 4], "fit": [1, 2], "rang": [1, 2, 4], "gtfive": 1, "to_str": 1, "furthermor": 1, "filtered_arrai": 1, "someth": 1, "end": [1, 2], "up": [1, 2], "tell": [1, 4, 5], "posit": 1, "your": [1, 4], "four": 1, "first": [1, 2], "last": 1, "accord": 1, "produc": 1, "output": 1, "so": [1, 2, 4], "found": 1, "protocol": 2, "implement": 2, "store": [2, 3, 4], "send": 2, "receiv": 2, "file": [2, 3], "framework": 2, "particularli": 2, "flightserverbas": 2, "class": [2, 4], "pathlib": 2, "flightserv": 2, "def": 2, "__init__": 2, "self": 2, "locat": [2, 4], "grpc": 2, "8815": 2, "repo": 2, "kwarg": 2, "super": 2, "_locat": 2, "_repo": 2, "_make_flight_info": 2, "dataset_path": 2, "read_schema": 2, "metadata": 2, "read_metadata": 2, "descriptor": 2, "flightdescriptor": 2, "for_path": 2, "utf": 2, "endpoint": 2, "flightendpoint": 2, "flightinfo": 2, "num_row": 2, "serialized_s": 2, "list_flight": 2, "context": 2, "criteria": 2, "iterdir": 2, "yield": 2, "get_flight_info": 2, "decod": [2, 4], "do_put": 2, "reader": 2, "writer": [2, 4], "data_t": 2, "read_al": [2, 4], "write_t": [2, 4], "do_get": 2, "ticket": 2, "recordbatchstream": 2, "read_tabl": [2, 4], "list_act": 2, "drop_dataset": 2, "delet": [2, 4], "do_act": 2, "action": 2, "do_drop_dataset": 2, "bodi": 2, "to_pybyt": 2, "els": 2, "rais": 2, "notimplementederror": 2, "unlink": 2, "server": 2, "charg": 2, "data": [2, 3], "fetch": 2, "likewis": 2, "regard": 2, "specif": 2, "actual": [2, 4], "client": 2, "download": 2, "would": [2, 4, 5], "pretti": 2, "useless": 2, "didn": 2, "creat": [2, 3, 4, 5], "respons": 2, "deal": [2, 5], "save": [2, 3], "request": [2, 5], "add": [2, 4], "do": [2, 4], "custom": 2, "previou": [2, 4], "ad": [2, 3], "execut": 2, "thu": 2, "subclass": 2, "dispatch": 2, "properli": 2, "invok": [2, 4], "expect": 2, "serv": [2, 3], "__name__": 2, "__main__": 2, "mkdir": 2, "exist_ok": 2, "onc": [2, 4], "perform": [2, 3], "tabl": [2, 4], "upload": 2, "mario": 2, "luigi": 2, "peach": 2, "charact": 2, "upload_descriptor": 2, "_": 2, "close": 2, "abl": [2, 4], "retriev": [2, 4], "newli": 2, "total_record": 2, "size": [2, 4], "total_byt": 2, "read": [2, 3, 5], "to_panda": 2, "head": 2, "finish": 2, "drop": 2, "To": [2, 4], "confirm": 2, "current": 2, "exist": [2, 3, 4, 5], "improv": 2, "avoid": 2, "hold": 2, "entir": 2, "iter": [2, 4], "befor": [2, 4], "advantag": 2, "write": [2, 3], "increment": [2, 3], "open": 2, "wb": [2, 4], "sink": [2, 4], "parquetwrit": 2, "parquetfil": 2, "generatorstream": 2, "schema_arrow": 2, "iter_batch": 2, "ve": 2, "modifi": 2, "instead": [2, 4, 5], "batch": [2, 3, 4], "come": [2, 4], "ani": [2, 4], "record": [2, 3, 4], "u": [2, 4], "handl": [2, 4], "don": [2, 4], "while": [2, 4], "mean": [2, 3], "must": [2, 4], "call": [2, 4], "contrast": 2, "requir": [2, 4], "front": 2, "transfer": 2, "pure": 2, "give": 2, "spin": 2, "ll": 2, "had": 2, "num_batch": 2, "1024": 2, "rows_per_batch": 2, "4096": 2, "arrai": [2, 3], "int": 2, "write_batch": 2, "again": 2, "arriv": 2, "total_row": 2, "got": 2, "total": 2, "4194304": 2, "often": 2, "identifi": 2, "who": 2, "thei": [2, 5], "simplest": 2, "scheme": 2, "At": 2, "startup": 2, "itself": 2, "usernam": [2, 4], "author": 2, "token": 2, "futur": 2, "encrypt": 2, "channel": 2, "enabl": 2, "describ": 2, "http": 2, "basic": 2, "doe": 2, "rfc": 2, "7325": 2, "per": 2, "se": 2, "interfac": [2, 4], "demonstr": [2, 3], "below": 2, "minim": 2, "base64": 2, "secret": [2, 4], "echoserv": 2, "just": [2, 4], "echo": 2, "doaction": 2, "basicauthservermiddlewarefactori": 2, "servermiddlewarefactori": 2, "middlewar": 2, "paramet": 2, "cred": 2, "str": 2, "accept": 2, "map": [2, 3], "bearer": 2, "start_cal": 2, "info": 2, "header": 2, "valid": 2, "credenti": [2, 4], "everi": 2, "search": [2, 3], "insensit": 2, "auth_head": 2, "lower": 2, "break": 2, "flightunauthenticatederror": 2, "No": 2, "suppli": 2, "authtyp": 2, "tokenvalu": 2, "g": 2, "random": [2, 4], "auth_typ": 2, "partit": [2, 3], "initi": 2, "login": 2, "same": [2, 4, 5], "auth": 2, "b64decod": 2, "unknown": 2, "invalid": 2, "token_urlsaf": 2, "32": 2, "basicauthservermiddlewar": 2, "elif": 2, "servermiddlewar": 2, "sending_head": 2, "noopauthhandl": 2, "serverauthhandl": 2, "handler": 2, "respond": 2, "handshak": 2, "rpc": 2, "authenticate_basic_token": 2, "otherwis": 2, "op": 2, "outgo": 2, "incom": 2, "is_valid": 2, "auth_handl": 2, "8816": 2, "test": [2, 3], "make": [2, 4], "log": 2, "token_pair": 2, "hello": 2, "world": 2, "flightcallopt": 2, "fail": [2, 5], "error": [2, 4], "try": [2, 4, 5], "except": [2, 5], "unauthent": 2, "runtimeerror": 2, "detail": [2, 4], "Or": 2, "wrong": 2, "scenario": 2, "traffic": 2, "manag": 2, "via": 2, "commun": 2, "layer": 2, "messag": 2, "achiev": 2, "certif": 2, "dure": 2, "develop": 2, "easiest": 2, "approach": 2, "sign": 2, "load": [2, 4], "public": 2, "privat": 2, "root": 2, "product": 2, "environ": 2, "recommend": 2, "dotnet": 2, "window": [2, 4], "openssl": 2, "linux": [2, 4], "maco": 2, "altern": 2, "repositori": 2, "depend": 2, "mai": 2, "crt": 2, "One": 2, "pleas": 2, "visit": 2, "ibm": 2, "articl": 2, "run": 2, "work": [2, 3], "argpars": 2, "host": 2, "localhost": 2, "tls_certif": 2, "verify_cli": 2, "root_certif": 2, "classmethod": 2, "descriptor_to_kei": 2, "descriptor_typ": 2, "command": 2, "tupl": 2, "main": 2, "parser": 2, "argumentpars": 2, "add_argu": 2, "narg": 2, "metavar": 2, "certfil": 2, "keyfil": 2, "arg": 2, "parse_arg": 2, "port": 2, "5005": 2, "rb": 2, "cert_fil": 2, "tls_cert_chain": 2, "key_fil": 2, "tls_private_kei": 2, "append": [2, 3], "format": [2, 4], "push": 2, "assum": 2, "object": [2, 3, 4, 5], "datafram": 2, "push_to_serv": 2, "object_to_send": 2, "from_panda": 2, "help": 2, "trust": 2, "tls_root": 2, "root_cert": 2, "tls_root_cert": 2, "flightclient": 2, "anim": 2, "dog": 2, "cat": 2, "mous": 2, "big": [2, 4], "small": 2, "tini": 2, "df": 2, "animaldata": 2, "script": 2, "out": [2, 4], "distribut": 2, "collect": [2, 3], "level": 2, "measur": 2, "order": 2, "correl": 2, "span": 2, "manual": [2, 4, 5], "automat": [2, 5], "show": 2, "accomplish": 2, "inject": 2, "extract": 2, "side": 2, "defin": [2, 5], "statu": 2, "statuscod": 2, "clienttracingmiddlewarefactori": 2, "clientmiddlewarefactori": 2, "_tracer": 2, "get_trac": 2, "start_span": 2, "clienttracingmiddlewar": 2, "clientmiddlewar": 2, "_span": 2, "ctx": 2, "set_span_in_context": 2, "carrier": 2, "call_complet": 2, "record_except": 2, "set_statu": 2, "ok": 2, "servertracingmiddlewarefactori": 2, "servertracingmiddlewar": 2, "configur": 2, "export": 2, "processor": 2, "both": [2, 4], "sdk": 2, "somewher": 2, "sake": 2, "normal": [2, 4], "jaeger": 2, "part": [2, 4], "resourc": 2, "minimum": 2, "hostnam": 2, "process": 2, "id": [2, 4], "version": 2, "system": [2, 5], "tracerprovid": 2, "simplespanprocessor": 2, "service_nam": 2, "spanexport": 2, "spanexportresult": 2, "testspanexport": 2, "success": 2, "configure_trac": 2, "backend": 2, "although": 2, "necessari": [2, 5], "consol": 2, "good": 2, "anywai": 2, "attribut": 2, "my": 2, "add_span_processor": 2, "set_tracer_provid": 2, "earlier": 2, "within": [2, 4], "activ": 2, "pick": 2, "tracer": 2, "start_as_current_span": 2, "hello_world": 2, "drain": 2, "There": 2, "n": [2, 4], "status_cod": 2, "flightmethod": 2, "unset": 2, "three": 2, "solv": 3, "task": 3, "user": [3, 4], "robust": 3, "well": 3, "solut": 3, "dev273": 3, "parquet": 3, "subset": 3, "disk": 3, "csv": 3, "s3": 3, "feather": 3, "line": 3, "delimit": 3, "json": 3, "compress": 3, "plain": 3, "categor": 3, "merg": 3, "manipul": 3, "comput": 3, "min": 3, "max": 3, "count": 3, "occurr": 3, "element": 3, "appli": [3, 5], "arithmet": 3, "replac": 3, "group": [3, 5], "sort": [3, 4], "match": 3, "predic": 3, "filter": [3, 4], "flight": 3, "simpl": 3, "storag": 3, "servic": 3, "stream": 3, "authent": 3, "password": 3, "secur": 3, "connect": 3, "tl": 3, "propag": 3, "opentelemetri": 3, "trace": 3, "page": 3, "apach": 4, "written": 4, "pq": 4, "95": 4, "96": 4, "97": 4, "98": 4, "restrict": 4, "argument": 4, "project": 4, "refer": 4, "document": 4, "syntax": 4, "apart": 4, "dump": 4, "raw": 4, "direct": 4, "ipc": 4, "num": 4, "osfil": 4, "arraydata": 4, "new_fil": 4, "were": 4, "adapt": 4, "accordingli": 4, "memory_map": 4, "r": 4, "sourc": [4, 5], "loaded_arrai": 4, "open_fil": 4, "It": 4, "write_csv": 4, "write_opt": 4, "writeopt": 4, "include_head": 4, "whole": 4, "csvwriter": 4, "int32": [4, 5], "datachunk": 4, "codepath": 4, "thread": 4, "read_csv": 4, "best": 4, "further": 4, "drive": 4, "convertopt": 4, "usual": 4, "sens": 4, "separ": [4, 5], "write_dataset": 4, "effort": 4, "birthdai": 4, "2000": 4, "2009": 4, "randint": 4, "month": 4, "x": 4, "int16": 4, "subdirectori": 4, "directori": 4, "localf": 4, "localfilesystem": 4, "partitioned_dir_cont": 4, "get_file_info": 4, "fileselector": 4, "recurs": 4, "filetyp": 4, "2001": 4, "2002": 4, "2003": 4, "2004": 4, "2005": 4, "2006": 4, "2007": 4, "2008": 4, "compos": 4, "piec": 4, "discov": 4, "dataset1": 4, "dataset2": 4, "dataset3": 4, "view": 4, "to_tabl": 4, "22": 4, "23": 4, "24": 4, "25": 4, "26": 4, "27": 4, "28": 4, "29": 4, "notic": 4, "forc": 4, "what": [4, 5], "reason": 4, "better": 4, "_name": 4, "abstract": 4, "remot": 4, "hdf": 4, "ursa": 4, "lab": 4, "taxi": 4, "2011": 4, "subtreefilesystem": 4, "s3filesystem": 4, "region": 4, "east": 4, "anonym": 4, "01": 4, "02": 4, "03": 4, "04": 4, "05": 4, "06": 4, "07": 4, "08": 4, "09": 4, "bucket": 4, "local": 4, "abov": 4, "throw": 4, "aw": 4, "instruct": 4, "access": 4, "mac": 4, "appropri": [4, 5], "aws_access_key_id": 4, "your_aws_access_key_id": 4, "aws_secret_access_kei": 4, "your_aws_secret_access_kei": 4, "ft": 4, "write_feath": 4, "builtin": 4, "tempfil": 4, "namedtemporaryfil": 4, "w": 4, "read_json": 4, "to_pydict": 4, "nativ": 4, "box": 4, "driven": 4, "lz4": 4, "snappi": 4, "compressedoutputstream": 4, "gz": 4, "gzip": 4, "decompress": 4, "done": [4, 5], "compressedinputstream": 4, "explain": 4, "next": 4, "applic": 4, "special": 4, "wrote": 4, "simpli": 4, "table_feath": 4, "table_parquet": 4, "involv": 4, "wrap": 4, "table_csv": 4, "smart": 4, "enough": 4, "detect": 4, "extens": 4, "bz2": 4, "table_csv2": 4, "howev": 5, "ensur": 5, "interoper": 5, "databas": 5, "warehous": 5, "chapter": 5, "chang": 5, "int8": 5, "detain": 5, "own": 5, "union": 5, "float64": 5, "far": 5, "compat": 5, "schema_int32": 5, "unifi": 5, "superset": 5, "first_schema": 5, "countri": 5, "popul": 5, "second_schema": 5, "country_cod": 5, "languag": 5, "unify_schema": 5, "union_schema": 5, "overlap": 5, "still": 5, "collid": 5, "retain": 5, "third_schema": 5, "lat": 5, "float32": 5, "long": 5, "float": 5, "diverg": 5, "numer": 5, "unabl": 5, "becaus": 5, "declar": 5, "arrowinvalid": 5, "arrowtypeerror": 5, "incompat": 5, "v": 5}, "objects": {}, "objtypes": {}, "objnames": {}, "titleterms": {"creat": 0, "arrow": [0, 2, 3, 4, 5], "object": 0, "content": [0, 1, 2, 3, 4, 5], "arrai": [0, 1, 4, 5], "tabl": [0, 1, 3, 5], "from": [0, 4], "plain": 0, "type": [0, 5], "record": 0, "batch": 0, "store": 0, "categor": 0, "data": [0, 1, 4, 5], "manipul": 1, "comput": 1, "mean": 1, "min": 1, "max": 1, "valu": 1, "an": [1, 5], "count": 1, "occurr": 1, "element": 1, "appli": 1, "arithmet": 1, "function": 1, "append": 1, "exist": 1, "ad": 1, "column": 1, "replac": 1, "group": 1, "sort": 1, "search": 1, "match": 1, "predic": 1, "filter": 1, "us": 1, "mask": 1, "flight": 2, "simpl": 2, "parquet": [2, 4], "storag": 2, "servic": 2, "stream": 2, "authent": 2, "user": 2, "password": 2, "secur": 2, "connect": 2, "tl": 2, "propag": 2, "opentelemetri": 2, "trace": 2, "apach": 3, "python": 3, "cookbook": 3, "indic": 3, "read": 4, "write": 4, "file": 4, "subset": 4, "save": 4, "disk": 4, "memori": 4, "map": 4, "csv": 4, "increment": 4, "partit": 4, "dataset": 4, "s3": 4, "feather": 4, "line": 4, "delimit": 4, "json": 4, "compress": 4, "work": 5, "schema": 5, "set": 5, "merg": 5, "multipl": 5}, "envversion": {"sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1, "sphinx": 60}, "alltitles": {"Creating Arrow Objects": [[0, "creating-arrow-objects"]], "Contents": [[0, "contents"], [1, "contents"], [2, "contents"], [5, "contents"], [4, "contents"]], "Creating Arrays": [[0, "creating-arrays"]], "Creating Tables": [[0, "creating-tables"]], "Create Table from Plain Types": [[0, "create-table-from-plain-types"]], "Creating Record Batches": [[0, "creating-record-batches"]], "Store Categorical Data": [[0, "store-categorical-data"]], "Data Manipulation": [[1, "data-manipulation"]], "Computing Mean/Min/Max values of an array": [[1, "computing-mean-min-max-values-of-an-array"]], "Counting Occurrences of Elements": [[1, "counting-occurrences-of-elements"]], "Applying arithmetic functions to arrays.": [[1, "applying-arithmetic-functions-to-arrays"]], "Appending tables to an existing table": [[1, "appending-tables-to-an-existing-table"]], "Adding a column to an existing Table": [[1, "adding-a-column-to-an-existing-table"]], "Replacing a column in an existing Table": [[1, "replacing-a-column-in-an-existing-table"]], "Group a Table": [[1, "group-a-table"]], "Sort a Table": [[1, "sort-a-table"]], "Searching for values matching a predicate in Arrays": [[1, "searching-for-values-matching-a-predicate-in-arrays"]], "Filtering Arrays using a mask": [[1, "filtering-arrays-using-a-mask"]], "Arrow Flight": [[2, "arrow-flight"]], "Simple Parquet storage service with Arrow Flight": [[2, "simple-parquet-storage-service-with-arrow-flight"]], "Streaming Parquet Storage Service": [[2, "streaming-parquet-storage-service"]], "Authentication with user/password": [[2, "authentication-with-user-password"]], "Securing connections with TLS": [[2, "securing-connections-with-tls"]], "Propagating OpenTelemetry Traces": [[2, "propagating-opentelemetry-traces"]], "Apache Arrow Python Cookbook": [[3, "apache-arrow-python-cookbook"]], "Contents:": [[3, null]], "Indices and tables": [[3, "indices-and-tables"]], "Working with Schema": [[5, "working-with-schema"]], "Setting the data type of an Arrow Array": [[5, "setting-the-data-type-of-an-arrow-array"]], "Setting the schema of a Table": [[5, "setting-the-schema-of-a-table"]], "Merging multiple schemas": [[5, "merging-multiple-schemas"]], "Reading and Writing Data": [[4, "reading-and-writing-data"]], "Write a Parquet file": [[4, "write-a-parquet-file"]], "Reading a Parquet file": [[4, "reading-a-parquet-file"]], "Reading a subset of Parquet data": [[4, "reading-a-subset-of-parquet-data"]], "Saving Arrow Arrays to disk": [[4, "saving-arrow-arrays-to-disk"]], "Memory Mapping Arrow Arrays from disk": [[4, "memory-mapping-arrow-arrays-from-disk"]], "Writing CSV files": [[4, "writing-csv-files"]], "Writing CSV files incrementally": [[4, "writing-csv-files-incrementally"]], "Reading CSV files": [[4, "reading-csv-files"]], "Writing Partitioned Datasets": [[4, "writing-partitioned-datasets"]], "Reading Partitioned data": [[4, "reading-partitioned-data"]], "Reading Partitioned Data from S3": [[4, "reading-partitioned-data-from-s3"]], "Write a Feather file": [[4, "write-a-feather-file"]], "Reading a Feather file": [[4, "reading-a-feather-file"]], "Reading Line Delimited JSON": [[4, "reading-line-delimited-json"]], "Writing Compressed Data": [[4, "writing-compressed-data"]], "Reading Compressed Data": [[4, "reading-compressed-data"]]}, "indexentries": {}})