import sqlite3
# Open (or create) the on-disk SQLite database file and get a cursor for
# running SQL statements against it.
conn = sqlite3.connect('example.db')
cursor = conn.cursor()

# Drop any `student` table left over from a previous run first, so the script
# always starts from an empty table instead of appending to stale rows.
cursor.execute("DROP TABLE IF EXISTS student;")
conn.commit()

# Create the table only after the drop. The previous order (create, then drop)
# left the database without a `student` table, so the INSERT/SELECT statements
# that follow failed with "no such table: student".
cursor.execute('''CREATE TABLE IF NOT EXISTS student
             (id, name, major, score);''')
conn.commit()

import pandas as pd
def print_student_details():
    """Return the full contents of the ``student`` table as a DataFrame.

    Runs ``SELECT * FROM student;`` on the module-level ``cursor`` and labels
    the resulting columns ``id``, ``name``, ``major`` and ``score``.
    """
    cursor.execute("SELECT * FROM student;")
    # Once a query has been executed, the cursor gives access to the rows it
    # produced; fetchall() returns all of them at once as a list.
    rows = cursor.fetchall()
    return pd.DataFrame(rows, columns=['id', 'name', 'major', 'score'])

# --- Add a single record -----------------------------------------------------
# Insert one row with literal values, commit it, then fetch the table contents.
# NOTE: print_student_details() returns a DataFrame rather than printing it, so
# the result is only shown when this runs as the last expression of a notebook
# cell.
sql = "INSERT INTO student (id, name, major, score) VALUES (5, 'PJ', 'CS', 85);"
cursor.execute(sql)
conn.commit()
print_student_details()

# --- Delete records ----------------------------------------------------------
# Remove every row whose name is 'PJ' (the row inserted just above).
sql_delete = "DELETE FROM student WHERE name='PJ';"
cursor.execute(sql_delete)
conn.commit()
print_student_details()

# --- Bulk insert -------------------------------------------------------------
# Each tuple is one (id, name, major, score) row. Tom's score is None, which
# sqlite3 stores as SQL NULL (used by the IS NULL query later in the script).
students = [
    (0, 'PJ', 'CS', 85),
    (1, 'John', 'Math', 90),
    (2, 'Jane', 'Math', 85),
    (3, 'Bob', 'English', 95),
    (4, 'Alice', 'History', 80),
    (5, 'Tom', 'Art', None),
    (6, 'Mary', 'Music', 98)
]
# Insert all rows with one parameterized statement; the four `?` placeholders
# are filled positionally from each tuple in `students`.
cursor.executemany('INSERT INTO student VALUES (?,?,?,?)', students)
conn.commit()
print_student_details()

# --- Modify a row ------------------------------------------------------------
# Set the score to 90 for every row named 'PJ'.
cursor.execute("UPDATE student SET score = 90 WHERE name = 'PJ'")
conn.commit()
print_student_details()

# Each query below stores its rows in `result` and wraps them in a DataFrame
# whose labels match the selected columns. The DataFrame expressions are bare,
# so they are only displayed when run as the last line of a notebook cell.

# Retrieve every row and every column.
result = cursor.execute("SELECT * FROM student;").fetchall()
pd.DataFrame(data=result, columns=['id', 'name', 'major', 'score'])

# Retrieve only two of the columns.
result = cursor.execute("SELECT name, score FROM student;").fetchall()
pd.DataFrame(data=result, columns=['name', 'score'])

# WHERE with a comparison: scores strictly above 90.
result = cursor.execute("SELECT * FROM student WHERE score > 90;").fetchall()
pd.DataFrame(data=result, columns=['id', 'name', 'major', 'score'])

# WHERE with inequality: scores different from 80.
result = cursor.execute("SELECT * FROM student WHERE score <> 80;").fetchall()
pd.DataFrame(data=result, columns=['id', 'name', 'major', 'score'])

# WHERE with a range: BETWEEN includes both endpoints.
result = cursor.execute("SELECT * FROM student WHERE score BETWEEN 80 AND 95;").fetchall()
pd.DataFrame(data=result, columns=['id', 'name', 'major', 'score'])

# All three queries use SELECT * on `student`, so the rows come back as
# (id, name, major, score). The DataFrame labels must follow that order;
# the earlier labels ('age', 'gender') belonged to a different table and
# mislabelled the major and score columns.

# WHERE ... IN: rows whose major is one of the listed values.
cursor.execute("SELECT * FROM student WHERE major in ('English', 'Math')")
result = cursor.fetchall()
pd.DataFrame(result, columns=['id', 'name', 'major', 'score'])

# LIKE with %: names starting with 'J' followed by any number of characters.
cursor.execute("SELECT * FROM student WHERE name LIKE 'J%';")
result = cursor.fetchall()
pd.DataFrame(result, columns=['id', 'name', 'major', 'score'])

# LIKE with _: exactly one arbitrary character between 'J' and 'hn'.
cursor.execute("SELECT * FROM student WHERE name LIKE 'J_hn';")
result = cursor.fetchall()
pd.DataFrame(result, columns=['id', 'name', 'major', 'score'])

# Rows whose score was stored as NULL (inserted as None from Python).
result = cursor.execute("SELECT * FROM student WHERE score is NULL;").fetchall()
pd.DataFrame(data=result, columns=['id', 'name', 'major', 'score'])

# ORDER BY ... DESC: sort by score, highest first.
result = cursor.execute("SELECT id, name, score FROM student ORDER BY score DESC;").fetchall()
pd.DataFrame(data=result, columns=['id', 'name', 'score'])

# DISTINCT: each major listed once.
result = cursor.execute("SELECT DISTINCT major FROM student;").fetchall()
pd.DataFrame(data=result, columns=['Major'])

# GROUP BY with an aggregate: mean score per major.
result = cursor.execute("SELECT major, AVG(score) FROM student GROUP BY major;").fetchall()
pd.DataFrame(data=result, columns=['Major', 'Mean Score'])

# HAVING filters the groups themselves: keep majors with more than one row.
result = cursor.execute("SELECT major, AVG(score) AS avg_score FROM student \
                Group by major HAVING COUNT(*) > 1").fetchall()
pd.DataFrame(data=result, columns=['major', 'AVG(score)'])

# The join examples need a second table, st_info(name, age, gender). Nothing
# earlier in this script creates it, so on a fresh database the queries below
# would fail with "no such table: st_info". Create it when missing and seed it
# only when it is empty, so an already populated table is left untouched.
cursor.execute("CREATE TABLE IF NOT EXISTS st_info (name, age, gender);")
if cursor.execute("SELECT COUNT(*) FROM st_info;").fetchone()[0] == 0:
    cursor.executemany(
        "INSERT INTO st_info (name, age, gender) VALUES (?, ?, ?)",
        [
            ('Alice', 20, 'Female'),
            ('Bob', 22, 'Male'),
            ('Charlie', 21, 'Male'),
            ('David', 23, 'Male'),
            ('Eve', 22, 'Female'),
            ('Frank', 21, 'Male'),
        ],
    )
conn.commit()

# Show the contents of st_info on its own.
cursor.execute("SELECT * FROM st_info;")
result = cursor.fetchall()
pd.DataFrame(result, columns=['name', 'age', 'gender'])

# The joined rows carry the four student columns followed by the three st_info
# columns, which is why 'name' appears twice in the labels below.

# INNER JOIN: only students whose name also appears in st_info.
cursor.execute("SELECT * FROM student INNER JOIN st_info ON student.name=st_info.name;")
result = cursor.fetchall()
pd.DataFrame(result, columns=['id', 'name', 'major', 'score', 'name', 'age', 'gender'])

# LEFT OUTER JOIN: every student; st_info columns are NULL when there is no match.
cursor.execute("SELECT * FROM student LEFT OUTER JOIN st_info ON student.name=st_info.name;")
result = cursor.fetchall()
pd.DataFrame(result, columns=['id', 'name', 'major', 'score', 'name', 'age', 'gender'])

# FULL OUTER JOIN: every row from both tables, NULL-padded on the unmatched side.
# NOTE: SQLite supports FULL OUTER JOIN only from version 3.39.0; on older
# library versions this statement raises sqlite3.OperationalError.
cursor.execute("SELECT * FROM student FULL OUTER JOIN st_info ON student.name=st_info.name;")
result = cursor.fetchall()
pd.DataFrame(result, columns=['id', 'name', 'major', 'score', 'name', 'age', 'gender'])

# Release the cursor and the SQLite connection.
cursor.close()
conn.close()

# sign in
import psycopg2
# Connection settings passed to psycopg2.connect() as keyword arguments.
# NOTE(review): the password is hard-coded in source; presumably acceptable for
# a local teaching database only - confirm before reusing this elsewhere.
db_params = {
    'dbname': 'data_science',
    'user': 'postgres',
    'password': '12345678',
    'host': 'localhost',  # database host address
    'port': '5432'        # PostgreSQL default port
}
# From here on `conn` and `cursor` refer to the PostgreSQL connection and
# replace the SQLite objects of the same names used earlier in the file.
conn = psycopg2.connect(**db_params)
cursor = conn.cursor()

# Start from a clean slate: remove any `scores` table left by a previous run.
cursor.execute("DROP TABLE IF EXISTS scores;")
conn.commit()

# Unlike the untyped SQLite table above, the columns here are declared with types.
cursor.execute("CREATE TABLE IF NOT EXISTS scores (id INT, name VARCHAR(50), score INT)")
conn.commit()

# Insert a single row with literal values.
cursor.execute("INSERT INTO scores (id, name, score) VALUES (1, 'John', 89);")
conn.commit()

import pandas as pd
# Read the table back and wrap the rows in a DataFrame for display.
cursor.execute("SELECT * FROM scores;")
results = cursor.fetchall()
pd.DataFrame(results, columns=['id', 'name', 'score'])

# Bulk insert: psycopg2 uses %s placeholders (sqlite3 used ? above); each tuple
# in `data` supplies the values for one row.
data = [(2, 'PJ', 78),
        (3, 'AJ', 85)]
cursor.executemany("INSERT INTO scores (id, name, score) VALUES (%s, %s, %s)", data)
conn.commit()

# Read the table again to see the newly inserted rows.
cursor.execute("SELECT * FROM scores;")
results = cursor.fetchall()
pd.DataFrame(results, columns=['id', 'name', 'score'])

# Release the cursor and the PostgreSQL connection.
cursor.close()
conn.close()

	name	age	gender
0	Alice	20	Female
1	Bob	22	Male
2	Charlie	21	Male
3	David	23	Male
4	Eve	22	Female
5	Frank	21	Male

	id	name	major	score	name	age	gender
0	0.0	PJ	CS	90.0	None	NaN	None
1	1.0	John	Math	90.0	None	NaN	None
2	2.0	Jane	Math	85.0	None	NaN	None
3	3.0	Bob	English	95.0	Bob	22.0	Male
4	4.0	Alice	History	80.0	Alice	20.0	Female
5	5.0	Tom	Art	NaN	None	NaN	None
6	6.0	Mary	Music	98.0	None	NaN	None
7	NaN	None	None	NaN	Charlie	21.0	Male
8	NaN	None	None	NaN	David	23.0	Male
9	NaN	None	None	NaN	Eve	22.0	Female
10	NaN	None	None	NaN	Frank	21.0	Male

Python数据处理¶

08. SQL数据库¶

上一讲：HTML、XML和JSON¶

一个更复杂的JSON对象的例子¶

为什么要使用数据库？¶

数据库（DB）¶

关系数据库的优缺点¶

ACID：原子性、一致性、隔离性、持久性¶

关系数据库的基本单位：记录¶

SQL（最初由IBM称为SEQUEL）¶

关系数据库管理系统（RDBMS）¶

SQLite数据库¶

Python sqlite3包实现了SQLite¶

添加/删除表：创建新表或删除现有表¶

添加/删除记录：在表中插入新行或删除现有行¶

修改行¶

检索记录：在表中查找所有行¶

过滤记录：SQL WHERE语句¶

关于WHERE语句的更多信息¶

更多关于WHERE语句的信息¶

NULL匹配空值（字段未填写的情况）¶

排序记录：SQL ORDER BY语句¶

更多过滤：DISTINCT¶

聚合结果：GROUP BY¶

更多关于`GROUP BY`的信息¶

合并表：JOIN¶

其他合并表的方式：OUTER JOIN¶

SQLite和PostgreSQL对比¶

psycopg2¶

Python数据处理¶

08. SQL数据库¶

上一讲：HTML、XML和JSON¶

一个更复杂的JSON对象的例子¶

为什么要使用数据库？¶

数据库（DB）¶

关系数据库的优缺点¶

ACID：原子性、一致性、隔离性、持久性¶

关系数据库的基本单位：记录¶

SQL（最初由IBM称为SEQUEL）¶

关系数据库管理系统（RDBMS）¶

SQLite数据库¶

Python sqlite3包实现了SQLite¶

添加/删除表：创建新表或删除现有表¶

添加/删除记录：在表中插入新行或删除现有行¶

修改行¶

检索记录：在表中查找所有行¶

过滤记录：SQL WHERE语句¶

关于WHERE语句的更多信息¶

更多关于WHERE语句的信息¶

NULL匹配空值（字段未填写的情况）¶

排序记录：SQL ORDER BY语句¶

更多过滤：DISTINCT¶

聚合结果：GROUP BY¶

更多关于GROUP BY的信息¶

合并表：JOIN¶

其他合并表的方式：OUTER JOIN¶

SQLite和PostgreSQL对比¶

psycopg2¶

更多关于`GROUP BY`的信息¶