|
2 | 2 | "cells": [
|
3 | 3 | {
|
4 | 4 | "cell_type": "markdown",
|
| 5 | + "metadata": { |
| 6 | + "collapsed": false |
| 7 | + }, |
5 | 8 | "source": [
|
6 | 9 | "# CrateDB Cloud Import\n",
|
7 | 10 | "\n",
|
|
20 | 23 | "## Setup\n",
|
21 | 24 | "\n",
|
22 | 25 | "To install the client SDK, use `pip`."
|
23 |
| - ], |
24 |
| - "metadata": { |
25 |
| - "collapsed": false |
26 |
| - } |
| 26 | + ] |
27 | 27 | },
|
28 | 28 | {
|
29 | 29 | "cell_type": "code",
|
30 | 30 | "execution_count": null,
|
| 31 | + "metadata": { |
| 32 | + "collapsed": false |
| 33 | + }, |
31 | 34 | "outputs": [],
|
32 | 35 | "source": [
|
33 | 36 | "#!pip install 'cratedb-toolkit'"
|
34 |
| - ], |
35 |
| - "metadata": { |
36 |
| - "collapsed": false |
37 |
| - } |
| 37 | + ] |
38 | 38 | },
|
39 | 39 | {
|
40 | 40 | "cell_type": "markdown",
|
| 41 | + "metadata": { |
| 42 | + "collapsed": false |
| 43 | + }, |
41 | 44 | "source": [
|
42 | 45 | "## Configuration\n",
|
43 | 46 | "\n",
|
|
56 | 59 | "CRATEDB_USERNAME='admin'\n",
|
57 | 60 | "CRATEDB_PASSWORD='<YOUR_PASSWORD>'\n",
|
58 | 61 | "```"
|
59 |
| - ], |
60 |
| - "metadata": { |
61 |
| - "collapsed": false |
62 |
| - } |
| 62 | + ] |
63 | 63 | },
|
64 | 64 | {
|
65 | 65 | "cell_type": "markdown",
|
| 66 | + "metadata": { |
| 67 | + "collapsed": false |
| 68 | + }, |
66 | 69 | "source": [
|
67 | 70 | "## Acquire Database Cluster\n",
|
68 | 71 | "\n",
|
|
71 | 74 | "\n",
|
72 | 75 | "For effortless configuration, it will obtain configuration settings from\n",
|
73 | 76 | "environment variables as defined above."
|
74 |
| - ], |
75 |
| - "metadata": { |
76 |
| - "collapsed": false |
77 |
| - } |
| 77 | + ] |
78 | 78 | },
|
79 | 79 | {
|
80 | 80 | "cell_type": "code",
|
|
84 | 84 | },
|
85 | 85 | "outputs": [],
|
86 | 86 | "source": [
|
87 |
| - "from cratedb_toolkit import ManagedCluster, InputOutputResource\n", |
| 87 | + "from cratedb_toolkit import InputOutputResource, ManagedCluster\n", |
88 | 88 | "\n",
|
89 | 89 | "cluster = ManagedCluster.from_env().start()"
|
90 | 90 | ]
|
91 | 91 | },
|
92 | 92 | {
|
93 | 93 | "cell_type": "markdown",
|
| 94 | + "metadata": { |
| 95 | + "collapsed": false |
| 96 | + }, |
94 | 97 | "source": [
|
95 | 98 | "## Import Data\n",
|
96 | 99 | "\n",
|
|
105 | 108 | "\n",
|
106 | 109 | "[NAB Data Corpus]: https://github.com/numenta/NAB/tree/master/data\n",
|
107 | 110 | "[MLflow and CrateDB]: https://github.com/crate/cratedb-examples/tree/main/topic/machine-learning/mlops-mlflow"
|
108 |
| - ], |
109 |
| - "metadata": { |
110 |
| - "collapsed": false |
111 |
| - } |
| 111 | + ] |
112 | 112 | },
|
113 | 113 | {
|
114 | 114 | "cell_type": "code",
|
115 | 115 | "execution_count": 4,
|
| 116 | + "metadata": { |
| 117 | + "collapsed": false |
| 118 | + }, |
116 | 119 | "outputs": [
|
117 | 120 | {
|
118 | 121 | "name": "stderr",
|
119 | 122 | "output_type": "stream",
|
120 | 123 | "text": [
|
121 |
| - "\u001B[36m==> Info: \u001B[0mStatus: REGISTERED (Your import job was received and is pending processing.)\n", |
122 |
| - "\u001B[36m==> Info: \u001B[0mDone importing 22.70K records\n", |
123 |
| - "\u001B[32m==> Success: \u001B[0mOperation completed.\n" |
| 124 | + "\u001b[36m==> Info: \u001b[0mStatus: REGISTERED (Your import job was received and is pending processing.)\n", |
| 125 | + "\u001b[36m==> Info: \u001b[0mDone importing 22.70K records\n", |
| 126 | + "\u001b[32m==> Success: \u001b[0mOperation completed.\n" |
124 | 127 | ]
|
125 | 128 | },
|
126 | 129 | {
|
|
140 | 143 | "# Invoke import job. Without `target` argument, the destination\n",
|
141 | 144 | "# table name will be derived from the input file name.\n",
|
142 | 145 | "cluster.load_table(source=source)"
|
143 |
| - ], |
144 |
| - "metadata": { |
145 |
| - "collapsed": false |
146 |
| - } |
| 146 | + ] |
147 | 147 | },
|
148 | 148 | {
|
149 | 149 | "cell_type": "markdown",
|
| 150 | + "metadata": { |
| 151 | + "collapsed": false |
| 152 | + }, |
150 | 153 | "source": [
|
151 | 154 | "## Query Data\n",
|
152 | 155 | "\n",
|
153 | 156 | "To verify that the dataset has been imported successfully, run an SQL\n",
|
154 | 157 | "command sampling a few records."
|
155 |
| - ], |
156 |
| - "metadata": { |
157 |
| - "collapsed": false |
158 |
| - } |
| 158 | + ] |
159 | 159 | },
|
160 | 160 | {
|
161 | 161 | "cell_type": "code",
|
162 | 162 | "execution_count": 5,
|
| 163 | + "metadata": { |
| 164 | + "collapsed": false |
| 165 | + }, |
163 | 166 | "outputs": [
|
164 | 167 | {
|
165 | 168 | "data": {
|
|
173 | 176 | "source": [
|
174 | 177 | "# Query data.\n",
|
175 | 178 | "cluster.query('SELECT * FROM \"nab-machine-failure\" LIMIT 5;')"
|
176 |
| - ], |
177 |
| - "metadata": { |
178 |
| - "collapsed": false |
179 |
| - } |
| 179 | + ] |
180 | 180 | }
|
181 | 181 | ],
|
182 | 182 | "metadata": {
|
|
0 commit comments