-
Notifications
You must be signed in to change notification settings - Fork 378
Expand file tree
/
Copy pathmagic.py
More file actions
136 lines (107 loc) · 5.26 KB
/
magic.py
File metadata and controls
136 lines (107 loc) · 5.26 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
import re
from IPython.core.magic import Magics, magics_class, cell_magic, line_magic, needs_local_scope
try:
from traitlets.config.configurable import Configurable
from traitlets import Bool, Int, Unicode
except ImportError:
from IPython.config.configurable import Configurable
from IPython.utils.traitlets import Bool, Int, Unicode
try:
from pandas.core.frame import DataFrame, Series
except ImportError:
DataFrame = None
Series = None
from sqlalchemy.exc import ProgrammingError, OperationalError
import sql.connection
import sql.parse
import sql.run
@magics_class
class SqlMagic(Magics, Configurable):
"""Runs SQL statement on a database, specified by SQLAlchemy connect string.
Provides the %%sql magic."""
autolimit = Int(100000, config=True, help="Automatically limit the size of the returned result sets")
style = Unicode('DEFAULT', config=True, help="Set the table printing style to any of prettytable's defined styles (currently DEFAULT, MSWORD_FRIENDLY, PLAIN_COLUMNS, RANDOM)")
short_errors = Bool(True, config=True, help="Don't display the full traceback on SQL Programming Error")
displaylimit = Int(1000, config=True, help="Automatically limit the number of rows displayed (full result set is still stored)")
autopandas = Bool(False, config=True, help="Return Pandas DataFrames instead of regular result sets")
column_local_vars = Bool(False, config=True, help="Return data into local variables from column names")
feedback = Bool(True, config=True, help="Print number of rows affected by DML")
dsn_filename = Unicode('odbc.ini', config=True, help="Path to DSN file. "
"When the first argument is of the form [section], "
"a sqlalchemy connection string is formed from the "
"matching section in the DSN file.")
def __init__(self, shell):
Configurable.__init__(self, config=shell.config)
Magics.__init__(self, shell=shell)
# Add ourself to the list of module configurable via %config
self.shell.configurables.append(self)
@needs_local_scope
@line_magic('sql')
@cell_magic('sql')
def execute(self, line, cell='', local_ns={}):
"""Runs SQL statement against a database, specified by SQLAlchemy connect string.
If no database connection has been established, first word
should be a SQLAlchemy connection string, or the user@db name
of an established connection.
Examples::
%%sql postgresql://me:mypw@localhost/mydb
SELECT * FROM mytable
%%sql me@mydb
DELETE FROM mytable
%%sql
DROP TABLE mytable
SQLAlchemy connect string syntax examples:
postgresql://me:mypw@localhost/mydb
sqlite://
mysql+pymysql://me:mypw@localhost/mydb
"""
# save globals and locals so they can be referenced in bind vars
user_ns = self.shell.user_ns.copy()
user_ns.update(local_ns)
parsed = sql.parse.parse('%s\n%s' % (line, cell), self)
conn = sql.connection.Connection.get(parsed['connection'])
first_word = parsed['sql'].split(None, 1)[:1]
if first_word and first_word[0].lower() == 'persist':
return self._persist_dataframe(parsed['sql'], conn, user_ns)
try:
result = sql.run.run(conn, parsed['sql'], self, user_ns)
if result is not None and ~isinstance(result, str) and self.column_local_vars:
#Instead of returning values, set variables directly in the
#users namespace. Variable names given by column names
if self.autopandas:
keys = result.keys()
else:
keys = result.keys
result = result.dict()
if self.feedback:
print('Returning data to local variables [{}]'.format(
', '.join(keys)))
self.shell.user_ns.update(result)
return None
else:
#Return results into the default ipython _ variable
return result
except (ProgrammingError, OperationalError) as e:
# Sqlite apparently return all errors as OperationalError :/
if self.short_errors:
print(e)
else:
raise
legal_sql_identifier = re.compile(r'^[A-Za-z0-9#_$]+')
def _persist_dataframe(self, raw, conn, user_ns):
if not DataFrame:
raise ImportError("Must `pip install pandas` to use DataFrames")
pieces = raw.split()
if len(pieces) != 2:
raise SyntaxError("Format: %sql [connection] persist <DataFrameName>")
frame_name = pieces[1].strip(';')
frame = eval(frame_name, user_ns)
if not isinstance(frame, DataFrame) and not isinstance(frame, Series):
raise TypeError('%s is not a Pandas DataFrame or Series' % frame_name)
table_name = frame_name.lower()
table_name = self.legal_sql_identifier.search(table_name).group(0)
frame.to_sql(table_name, conn.session.engine)
return 'Persisted %s' % table_name
def load_ipython_extension(ip):
"""Load the extension in IPython."""
ip.register_magics(SqlMagic)