diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..3664824 --- /dev/null +++ b/.gitignore @@ -0,0 +1,9 @@ +**/.DS_Store +**/*.ipynb_checkpoints/ +_site/* +_staffers/sheets_parser.json +.DS_Store +.*.swp +.*.swo +DS_Store +.bundle diff --git a/_site/acks/index.html b/_site/acks/index.html index 3dbf943..0792b31 100644 --- a/_site/acks/index.html +++ b/_site/acks/index.html @@ -1 +1 @@ - Acknowledgments | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Course Acknowledgments

The content and structure of Data 100 have been designed and developed over the years thanks to many dedicated faculty and instructors at UC Berkeley.

The Learning Data Science textbook that this course follows is authored by Sam Lau, Joseph Gonzalez, and Deborah Nolan.

Valuable and essential instructional contributors (alphabetical order): Ani Adhikari, Andrew Bray, John DeNero, Will Fithian, Josh Hug, Narges Norouzi, Fernando Pérez, Suraj Rampure, Allen Shen, Alvin Wan, and Lisa Yan.

+ Acknowledgments | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Course Acknowledgments

The content and structure of Data 100 have been designed and developed over the years thanks to many dedicated faculty and instructors at UC Berkeley.

The Learning Data Science textbook that this course follows is authored by Sam Lau, Joseph Gonzalez, and Deborah Nolan.

Valuable and essential instructional contributors (alphabetical order): Ani Adhikari, Andrew Bray, John DeNero, Will Fithian, Josh Hug, Narges Norouzi, Fernando Pérez, Suraj Rampure, Allen Shen, Alvin Wan, and Lisa Yan.

diff --git a/_site/announcements/index.html b/_site/announcements/index.html index 7821531..481444e 100644 --- a/_site/announcements/index.html +++ b/_site/announcements/index.html @@ -1 +1 @@ - Announcements | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Announcements

Announcements are stored in the _announcements directory and rendered according to the layout file, _layouts/announcement.html.

+ Announcements | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Announcements

Announcements are stored in the _announcements directory and rendered according to the layout file, _layouts/announcement.html.

diff --git a/_site/assets/css/just-the-docs-dark.css b/_site/assets/css/just-the-docs-dark.css index 3417639..7f6814f 100644 --- a/_site/assets/css/just-the-docs-dark.css +++ b/_site/assets/css/just-the-docs-dark.css @@ -429,7 +429,7 @@ blockquote { margin: 10px 0; margin-block-start: 0; margin-inline-start: 0; padd @media (min-width: 31.25rem) { .site-title { font-size: 24px !important; line-height: 1.25; } } @media (min-width: 50rem) { .site-title { padding-top: 0.5rem; padding-bottom: 0.5rem; } } -.site-logo { width: 100%; height: 100%; background-image: url("/su23/resources/assets/favicon/panda-logo.png"); background-repeat: no-repeat; background-position: left center; background-size: contain; } +.site-logo { width: 100%; height: 100%; background-image: url("/fa23-testing/resources/assets/favicon/panda-logo.png"); background-repeat: no-repeat; background-position: left center; background-size: contain; } .site-button { display: flex; height: 100%; padding: 1rem; align-items: center; } diff --git a/_site/assets/css/just-the-docs-default.css b/_site/assets/css/just-the-docs-default.css index 9d8aee0..838d37e 100644 --- a/_site/assets/css/just-the-docs-default.css +++ b/_site/assets/css/just-the-docs-default.css @@ -301,7 +301,7 @@ blockquote { margin: 10px 0; margin-block-start: 0; margin-inline-start: 0; padd @media (min-width: 31.25rem) { .site-title { font-size: 24px !important; line-height: 1.25; } } @media (min-width: 50rem) { .site-title { padding-top: 0.5rem; padding-bottom: 0.5rem; } } -.site-logo { width: 100%; height: 100%; background-image: url("/su23/resources/assets/favicon/panda-logo.png"); background-repeat: no-repeat; background-position: left center; background-size: contain; } +.site-logo { width: 100%; height: 100%; background-image: url("/fa23-testing/resources/assets/favicon/panda-logo.png"); background-repeat: no-repeat; background-position: left center; background-size: contain; } .site-button { display: flex; height: 100%; padding: 1rem; align-items: center; } diff --git a/_site/assets/css/just-the-docs-light.css b/_site/assets/css/just-the-docs-light.css index 5f0e94f..b73a5e1 100644 --- a/_site/assets/css/just-the-docs-light.css +++ b/_site/assets/css/just-the-docs-light.css @@ -301,7 +301,7 @@ blockquote { margin: 10px 0; margin-block-start: 0; margin-inline-start: 0; padd @media (min-width: 31.25rem) { .site-title { font-size: 24px !important; line-height: 1.25; } } @media (min-width: 50rem) { .site-title { padding-top: 0.5rem; padding-bottom: 0.5rem; } } -.site-logo { width: 100%; height: 100%; background-image: url("/su23/resources/assets/favicon/panda-logo.png"); background-repeat: no-repeat; background-position: left center; background-size: contain; } +.site-logo { width: 100%; height: 100%; background-image: url("/fa23-testing/resources/assets/favicon/panda-logo.png"); background-repeat: no-repeat; background-position: left center; background-size: contain; } .site-button { display: flex; height: 100%; padding: 1rem; align-items: center; } diff --git a/_site/assets/js/just-the-docs.js b/_site/assets/js/just-the-docs.js index 82d29bf..332944c 100644 --- a/_site/assets/js/just-the-docs.js +++ b/_site/assets/js/just-the-docs.js @@ -55,7 +55,7 @@ function initNav() { function initSearch() { var request = new XMLHttpRequest(); - request.open('GET', '/su23/assets/js/search-data.json', true); + request.open('GET', '/fa23-testing/assets/js/search-data.json', true); request.onload = function(){ if (request.status >= 200 && request.status < 400) { @@ -434,7 +434,7 @@ jtd.getTheme = function() { jtd.setTheme = function(theme) { var cssFile = document.querySelector('[rel="stylesheet"]'); - cssFile.setAttribute('href', '/su23/assets/css/just-the-docs-' + theme + '.css'); + cssFile.setAttribute('href', '/fa23-testing/assets/css/just-the-docs-' + theme + '.css'); } // Scroll site-nav to ensure the link to the current page is visible diff --git a/_site/assets/js/search-data.json b/_site/assets/js/search-data.json index c08de0b..ac4cee3 100644 --- a/_site/assets/js/search-data.json +++ b/_site/assets/js/search-data.json @@ -2,581 +2,581 @@ "doc": "Staff Pictures", "title": "Staff Pictures", "content": "Staff pictures go here . ", - "url": "/su23/resources/assets/staff_pics/README/", + "url": "/fa23-testing/resources/assets/staff_pics/README/", "relUrl": "/resources/assets/staff_pics/README/" },"1": { "doc": "Acknowledgments", "title": "Course Acknowledgments", "content": "The content and structure of Data 100 have been designed and developed over the years thanks to many dedicated faculty and instructors at UC Berkeley. The Learning Data Science textbook that this course follows is authored by Sam Lau, Joseph Gonzalez, and Deborah Nolan. Valuable and essential instructional contributors (alphabetical order): Ani Adhikari, Andrew Bray, John DeNero, Will Fithian, Josh Hug, Narges Norouzi, Fernando Pérez, Suraj Rampure, Allen Shen, Alvin Wan, and Lisa Yan. ", - "url": "/su23/acks/#course-acknowledgments", + "url": "/fa23-testing/acks/#course-acknowledgments", "relUrl": "/acks/#course-acknowledgments" },"2": { "doc": "Acknowledgments", "title": "Acknowledgments", "content": " ", - "url": "/su23/acks/", + "url": "/fa23-testing/acks/", "relUrl": "/acks/" },"3": { "doc": "Announcements", "title": "Announcements", "content": "Announcements are stored in the _announcements directory and rendered according to the layout file, _layouts/announcement.html. ", - "url": "/su23/announcements/", + "url": "/fa23-testing/announcements/", "relUrl": "/announcements/" },"4": { "doc": "Calendar", "title": "Calendar", "content": ". | Office Hours Calendar | Lecture, Discussion, and Special Events Calendar | . Note: If you are having trouble viewing the calendars below and are using Safari, we suggest switching to an alternate browser (like Chrome). Alternatively, you can go to Safari settings and switch “Prevent cross-site tracking” off, or you can see the first calendar here and the second calendar here. ", - "url": "/su23/calendar/", + "url": "/fa23-testing/calendar/", "relUrl": "/calendar/" },"5": { "doc": "Calendar", "title": "Office Hours Calendar", "content": "In-person office hours are in blue, click on each event to see which GSI and/or reader is running each office hour time. You should come to these with questions about anything – labs, homeworks, discussions, concepts, etc. Note: All office hours will be held in-person in Warren Hall 101B. Instructor office hours with Bella and Dominic appear in red. You should come to these with questions about concepts. ", - "url": "/su23/calendar/#office-hours-calendar", + "url": "/fa23-testing/calendar/#office-hours-calendar", "relUrl": "/calendar/#office-hours-calendar" },"6": { "doc": "Calendar", "title": "Lecture, Discussion, and Special Events Calendar", "content": "This calendar contains times for . | live lectures (in brown) | live discussion sections (in orange) | live exam prep and other reviews (in green) | . ", - "url": "/su23/calendar/#lecture-discussion-and-special-events-calendar", + "url": "/fa23-testing/calendar/#lecture-discussion-and-special-events-calendar", "relUrl": "/calendar/#lecture-discussion-and-special-events-calendar" },"7": { "doc": "Home / Schedule", "title": "Data 100: Principles and Techniques of Data Science", - "content": "UC Berkeley, Summer 2023 . Ed Datahub Gradescope Extenuating Circumstances . Bella Crouch She/Her/Hers . isabella.crouch@berkeley.edu . Office Hours: Tue, Th 3-4pm (Warren 111) . Dominic Liu He/Him/His . hangxingliu@berkeley.edu . Office Hours: Mon, Wed 3-4pm (Warren 111) . Welcome to Week 8! . ", - "url": "/su23/#data-100-principles-and-techniques-of-data-science", + "content": "UC Berkeley, Fall 2023 . Ed Datahub Gradescope Extenuating Circumstances . Fernando Pérez He/Him/His . fernando.perez@berkeley.edu . Narges Norouzi She/Her/Hers . norouzi@berkeley.edu . Announcements: . ", + "url": "/fa23-testing/#data-100-principles-and-techniques-of-data-science", "relUrl": "/#data-100-principles-and-techniques-of-data-science" },"8": { "doc": "Home / Schedule", "title": "Schedule", "content": " ", - "url": "/su23/#schedule", + "url": "/fa23-testing/#schedule", "relUrl": "/#schedule" },"9": { "doc": "Home / Schedule", "title": "Week 1", "content": "Jun 20 Lecture 1 Course Overview Note 1 Lab 1 Prerequisite Coding (due Jun 24) Homework 1A Plotting and the Permutation Test (due Jun 26) Homework 1B Prerequisite Math (due Jun 26) Jun 21 Lecture 2 Pandas I Note 2 Discussion 1 Math Prerequisites Solution Jun 22 Lecture 3 Pandas II Note 3 ", - "url": "/su23/#week-1", + "url": "/fa23-testing/#week-1", "relUrl": "/#week-1" },"10": { "doc": "Home / Schedule", "title": "Week 2", "content": "Jun 26 Lecture 4 Pandas III, EDA I Note 4 Discussion 2 Pandas worksheet, worksheet notebook, groupwork notebook Solution Lab 2 Pandas (due Jul 1) Lab 3 Data Cleaning and EDA (due Jul 1) Homework 2 Pandas (due Jun 29) Jun 27 Lecture 5 EDA II Note 5 Jun 28 Lecture 6 Text Wrangling, Regex Note 6 Discussion 3 EDA Solution Jun 29 Lecture 7 Visualization Note 7 Homework 3 Tweets (due Jul 3) Jun 30 Exam Prep 1 Pandas Solution ", - "url": "/su23/#week-2", + "url": "/fa23-testing/#week-2", "relUrl": "/#week-2" },"11": { "doc": "Home / Schedule", "title": "Week 3", "content": "Jul 3 Break (no lecture) Discussion 4 Regex (optional) Solution, Video Walkthrough Lab 4 Transformation (due Jul 8) Lab 5 Modeling, Summary Statistics, Loss Functions (due Jul 8) Homework 4 Bike Sharing (Visualization) (due Jul 6) Jul 4 Independence Day (no lecture) Jul 5 Lecture 8 Sampling Note 8 Discussion 5 Visualization Worksheet, Notebook Solution Jul 6 Lecture 9 Modeling, SLR Note 9 Homework 5A Sampling (due Jul 10) Homework 5B Modeling (due Jul 10) Jul 7 Exam Prep 2 Regex, KDE Plots Solution ", - "url": "/su23/#week-3", + "url": "/fa23-testing/#week-3", "relUrl": "/#week-3" },"12": { "doc": "Home / Schedule", "title": "Week 4", "content": "Jul 10 Lecture 10 Constant model, loss, and transformations Note 10 Discussion 6 Sampling, SLR Solution Lab 6 Ordinary Least Squares (due Jul 15) Lab 7 Gradient Descent, Feature Engineering (due Jul 15) Homework 6 Regression (due Jul 13) Jul 11 Lecture 11 Ordinary Least Squares (Multiple Linear Regression) Note 11 Jul 12 Lecture 12 Gradient Descent Note 12 Discussion 7 Transformations, OLS Solution Jul 13 Lecture 13 Sklearn, Feature Engineering Note 13 Project A1 Housing I (due Jul 17) ", - "url": "/su23/#week-4", + "url": "/fa23-testing/#week-4", "relUrl": "/#week-4" },"13": { "doc": "Home / Schedule", "title": "Week 5", "content": "Jul 17 Lecture 14 Case Study in Human Contexts and Ethics (CCAO) Note 14 Discussion 8 Gradient Descent, Feature Engineering Solution Lab 8 Model Selection (due Jul 22) Project A2 Housing II (due Jul 24) Jul 18 Lecture 15 Cross-Validation, Regularization Note 15 Jul 19 Break (no lecture) Discussion 9 Exam Review Jul 20 Midterm Midterm Exam (5-7 PM) ", - "url": "/su23/#week-5", + "url": "/fa23-testing/#week-5", "relUrl": "/#week-5" },"14": { "doc": "Home / Schedule", "title": "Week 6", "content": "Jul 24 Lecture 16 Random Variables Note 16 Discussion 10 Cross-Validation, Regularization Solution Lab 9 Probability (due Jul 29) Lab 10 Logistic Regression (due Jul 29) Homework 7 Probability and Estimators (due Jul 27) Jul 25 Lecture 17 Estimators, Bias, and Variance Note 17 Jul 26 Lecture 18 Logistic Regression I Note 18 Discussion 11 Random Variables, BVT Solution Jul 27 Lecture 19 Logistic Regression II Note 19 Project B1 Spam & Ham I (due Jul 31) Jul 28 Exam Prep 3 Regularization, Bias-Variance Tradeoff, Cross-Validation, Random Variables Solution ", - "url": "/su23/#week-6", + "url": "/fa23-testing/#week-6", "relUrl": "/#week-6" },"15": { "doc": "Home / Schedule", "title": "Week 7", "content": "Jul 31 Lecture 20 SQL I Note 20 Discussion 12 Logistic Regression Solution Lab 11 SQL (due Aug 5) Lab 12 PCA (due Aug 5) Project B2 Spam & Ham II (due Aug 3) Aug 1 Lecture 21 SQL II Note 21 Aug 2 Lecture 22 PCA I Note 22 Discussion 13 SQL Solution Aug 3 Lecture 23 PCA II Note 23 Homework 8 SQL, PCA (due Aug 7) ", - "url": "/su23/#week-7", + "url": "/fa23-testing/#week-7", "relUrl": "/#week-7" },"16": { "doc": "Home / Schedule", "title": "Week 8", "content": "Aug 7 Lecture 24 Decision Trees Note 24 Discussion 14 PCA Solution Lab 13 Decision Trees (optional) Aug 8 Lecture 25 Conclusion Aug 9 Break (no lecture) Discussion 15 Decision Trees, Final Review Aug 10 Final Final Exam (5-7 PM) ", - "url": "/su23/#week-8", + "url": "/fa23-testing/#week-8", "relUrl": "/#week-8" },"17": { "doc": "Home / Schedule", "title": "Home / Schedule", "content": " ", - "url": "/su23/", + "url": "/fa23-testing/", "relUrl": "/" },"18": { "doc": "Lecture 1 – Course Overview", "title": "Lecture 1 – Introduction", "content": "Presented by Bella Crouch and Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec01/#lecture-1--introduction", + "url": "/fa23-testing/lecture/lec01/#lecture-1--introduction", "relUrl": "/lecture/lec01/#lecture-1--introduction" },"19": { "doc": "Lecture 1 – Course Overview", "title": "Lecture 1 – Course Overview", "content": " ", - "url": "/su23/lecture/lec01/", + "url": "/fa23-testing/lecture/lec01/", "relUrl": "/lecture/lec01/" },"20": { "doc": "Lecture 2 – Pandas, Part I", "title": "Lecture 2 – Pandas, Part I", "content": "Presented by Bella Crouch . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | code (Data 8) | code HTML (Data 8) | recording | . ", - "url": "/su23/lecture/lec02/", + "url": "/fa23-testing/lecture/lec02/", "relUrl": "/lecture/lec02/" },"21": { "doc": "Lecture 3 – Pandas, Part II", "title": "Lecture 3 – Pandas, Part II", "content": "Presented by Bella Crouch . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec03/", + "url": "/fa23-testing/lecture/lec03/", "relUrl": "/lecture/lec03/" },"22": { "doc": "Lecture 4 – Pandas, Part III and EDA, Part I", "title": "Lecture 4 – Pandas, Part III and EDA, Part I", "content": "Presented by Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | Pandas Demo (HTML) | EDA Demo (HTML) | recording | . ", - "url": "/su23/lecture/lec04/", + "url": "/fa23-testing/lecture/lec04/", "relUrl": "/lecture/lec04/" },"23": { "doc": "Lecture 5 – EDA II", "title": "Lecture 5 – EDA II", "content": "Presented by Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec05/", + "url": "/fa23-testing/lecture/lec05/", "relUrl": "/lecture/lec05/" },"24": { "doc": "Lecture 6 – Text Wrangling and Regex", "title": "Lecture 6 – Text Wrangling and Regex", "content": "Presented by Bella Crouch . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording . | The screen is blank for the first 15 minutes of the recording, please follow along with the slides. Sorry for any inconvenience. | You can also watch the last 12 minutes of the Data 100 (Spring 2023) Lecture 5 recording. | . | . ", - "url": "/su23/lecture/lec06/", + "url": "/fa23-testing/lecture/lec06/", "relUrl": "/lecture/lec06/" },"25": { "doc": "Lecture 7 – Visualization", "title": "Lecture 7 – Visualization", "content": "Presented by Bella Crouch . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec07/", + "url": "/fa23-testing/lecture/lec07/", "relUrl": "/lecture/lec07/" },"26": { "doc": "Lecture 8 – Sampling", "title": "Lecture 8 – Sampling", "content": "Presented by Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec08/", + "url": "/fa23-testing/lecture/lec08/", "relUrl": "/lecture/lec08/" },"27": { "doc": "Lecture 9 – Modeling, SLR", "title": "Lecture 9 – Modeling, SLR", "content": "Presented by Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | recording | . ", - "url": "/su23/lecture/lec09/", + "url": "/fa23-testing/lecture/lec09/", "relUrl": "/lecture/lec09/" },"28": { "doc": "Lecture 10 – Constant model, loss, and transformations", "title": "Lecture 10 – Constant model, loss, and transformations", "content": "Presented by Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec10/", + "url": "/fa23-testing/lecture/lec10/", "relUrl": "/lecture/lec10/" },"29": { "doc": "Lecture 11 – Ordinary Least Squares", "title": "Lecture 11 – Ordinary Least Squares", "content": "Presented by Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec11/", + "url": "/fa23-testing/lecture/lec11/", "relUrl": "/lecture/lec11/" },"30": { "doc": "Lecture 12 – Gradient Descent", "title": "Lecture 12 – Gradient Descent", "content": "Presented by Bella Crouch . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec12/", + "url": "/fa23-testing/lecture/lec12/", "relUrl": "/lecture/lec12/" },"31": { "doc": "Lecture 13 – Sklearn, Feature Engineering", "title": "Lecture 13 – Sklearn, Feature Engineering", "content": "Presented by Bella Crouch . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec13/", + "url": "/fa23-testing/lecture/lec13/", "relUrl": "/lecture/lec13/" },"32": { "doc": "Lecture 14 – Case Study in Human Contexts and Ethics (CCAO)", "title": "Lecture 14 – Case Study in Human Contexts and Ethics (CCAO)", "content": "Presented by Ari Edmundson . | slides | case study article | recording | . ", - "url": "/su23/lecture/lec14/", + "url": "/fa23-testing/lecture/lec14/", "relUrl": "/lecture/lec14/" },"33": { "doc": "Lecture 15 – Cross-Validation, Regularization", "title": "Lecture 15 – Cross-Validation, Regularization", "content": "Presented by Bella Crouch . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec15/", + "url": "/fa23-testing/lecture/lec15/", "relUrl": "/lecture/lec15/" },"34": { "doc": "Lecture 16 – Random Variables", "title": "Lecture 16 – Random Variables", "content": "Presented by Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec16/", + "url": "/fa23-testing/lecture/lec16/", "relUrl": "/lecture/lec16/" },"35": { "doc": "Lecture 17 – Model Bias, Variance, and Inference", "title": "Lecture 17 – Model Bias, Variance, and Inference", "content": "Presented by Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec17/", + "url": "/fa23-testing/lecture/lec17/", "relUrl": "/lecture/lec17/" },"36": { "doc": "Lecture 18 – Logistic Regression I", "title": "Lecture 18 – Logistic Regression I", "content": "Presented by Bella Crouch . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec18/", + "url": "/fa23-testing/lecture/lec18/", "relUrl": "/lecture/lec18/" },"37": { "doc": "Lecture 19 – Logistic Regression II", "title": "Lecture 19 – Logistic Regression II", "content": "Presented by Bella Crouch . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec19/", + "url": "/fa23-testing/lecture/lec19/", "relUrl": "/lecture/lec19/" },"38": { "doc": "Lecture 20 – SQL I", "title": "Lecture 20 – SQL I", "content": "Presented by Bella Crouch . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec20/", + "url": "/fa23-testing/lecture/lec20/", "relUrl": "/lecture/lec20/" },"39": { "doc": "Lecture 21 – SQL II", "title": "Lecture 21 – SQL II", "content": "Presented by Bella Crouch . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec21/", + "url": "/fa23-testing/lecture/lec21/", "relUrl": "/lecture/lec21/" },"40": { "doc": "Lecture 22 – PCA I", "title": "Lecture 22 – PCA I", "content": "Presented by Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec22/", + "url": "/fa23-testing/lecture/lec22/", "relUrl": "/lecture/lec22/" },"41": { "doc": "Lecture 23 – PCA II", "title": "Lecture 23 – PCA II", "content": "Presented by Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | PCA II code HTML | Fashion MNIST code HTML | recording | . ", - "url": "/su23/lecture/lec23/", + "url": "/fa23-testing/lecture/lec23/", "relUrl": "/lecture/lec23/" },"42": { "doc": "Lecture 24 – Decision trees", "title": "Lecture 24 - Decision Trees", "content": "Presented by Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | code | code HTML | recording | . ", - "url": "/su23/lecture/lec24/#lecture-24---decision-trees", + "url": "/fa23-testing/lecture/lec24/#lecture-24---decision-trees", "relUrl": "/lecture/lec24/#lecture-24---decision-trees" },"43": { "doc": "Lecture 24 – Decision trees", "title": "Lecture 24 – Decision trees", "content": " ", - "url": "/su23/lecture/lec24/", + "url": "/fa23-testing/lecture/lec24/", "relUrl": "/lecture/lec24/" },"44": { "doc": "Lecture 25 – Conclusion", "title": "Lecture 25 - Conclusion", "content": "Presented by Bella Crouch and Dominic Liu . Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page. | slides | recording | . ", - "url": "/su23/lecture/lec25/#lecture-25---conclusion", + "url": "/fa23-testing/lecture/lec25/#lecture-25---conclusion", "relUrl": "/lecture/lec25/#lecture-25---conclusion" },"45": { "doc": "Lecture 25 – Conclusion", "title": "Lecture 25 – Conclusion", "content": " ", - "url": "/su23/lecture/lec25/", + "url": "/fa23-testing/lecture/lec25/", "relUrl": "/lecture/lec25/" },"46": { "doc": "Resources", "title": "Resources", "content": "Here is a collection of resources that will help you learn more about various concepts and skills covered in the class. Learning by reading is a key part of being a well rounded data scientist. We will not assign mandatory reading but instead encourage you to look at these and other materials. If you find something helpful, post it on EdStem, and consider contributing it to the course website. Jump to: . | Supplementary Course Notes | Optional Supplementary Textbook | Exam Resources | Course Website | Coding and Mathematics Resources . | Pandas | SQL | Regex | LaTeX | Other Web References | Calculus and Linear Algebra | Probability | . | Books | Wellness Resources | Data Science Education | Local Setup (Old) | . ", - "url": "/su23/resources/", + "url": "/fa23-testing/resources/", "relUrl": "/resources/" },"47": { "doc": "Resources", "title": "Supplementary Course Notes", "content": "Alongside each lecture are supplementary Course Notes. Lecture notes will be updated on a weekly basis, prior to the lecture. If you spot any errors or would like to suggest any changes, please email us at data100.instructors@berkeley.edu. ", - "url": "/su23/resources/#supplementary-course-notes", + "url": "/fa23-testing/resources/#supplementary-course-notes", "relUrl": "/resources/#supplementary-course-notes" },"48": { "doc": "Resources", "title": "Optional Supplementary Textbook", "content": "Alongside each lecture are optional textbook readings to the Data 100 textbook, Principles and Techniques of Data Science. Textbook readings are purely supplementary, and may contain material that is not in scope (and may also not be comprehensive). ", - "url": "/su23/resources/#optional-supplementary-textbook", + "url": "/fa23-testing/resources/#optional-supplementary-textbook", "relUrl": "/resources/#optional-supplementary-textbook" },"49": { "doc": "Resources", "title": "Exam Resources", "content": "| Semester | Midterm (1) | Midterm 2 | Final | Reference Sheet | . | Summer 2023 | Exam (Solutions) |   | Exam (Solutions) | Midterm, Final | . | Spring 2023 | Exam (Solutions) |   | Exam (Solutions) | Midterm, Final | . | Fall 2022 | Exam (Solutions) |   |   | Midterm | . | Summer 2022 | Exam (Solutions) |   | Exam (Solutions) | Midterm, Final | . | Spring 2022 | Exam (Solutions) | Exam (Solutions) | Exam (Solutions) | Midterm 1, Midterm 2, Final | . | Fall 2021 | Exam (Solutions) |   |   |   | . | Summer 2021 | Exam (Solutions) [Video] |   | Exam (Solutions) |   | . | Spring 2021 | Exam (Solutions) |   | Exam (Solutions) |   | . | Fall 2020 | Exam (Solutions) |   | Exam (Solutions) |   | . | Summer 2020 | Exam (Solutions) | Exam (Solutions) | Exam (Solutions) |   | . | Spring 2020 | Checkpoint (Solutions) |   | N/A | Checkpoint | . | Fall 2019 | Exam (Solutions) | Exam (Solutions) | Exam (Solutions) | Midterm 1 | . | Summer 2019 | Exam (Solutions) [Video] |   | Exam (Solutions) |   | . | Spring 2019 | Exam (Solutions) [Video] | Exam (Solutions) [Video] | Exam (Solutions) | Midterm 1 | . | Fall 2018 | Exam (Solutions) |   | Exam (Solutions) |   | . | Spring 2018 | Exam (Solutions) |   | Exam (Solutions) [Video] |   | . | Fall 2017 | Exam (Solutions) [Video] |   | Exam (Solutions) |   | . | Spring 2017 | Exam (Solutions) |   | Exam (Solutions) |   | . ", - "url": "/su23/resources/#exam-resources", + "url": "/fa23-testing/resources/#exam-resources", "relUrl": "/resources/#exam-resources" },"50": { "doc": "Resources", "title": "Course Website", "content": "We will be posting all lecture materials on the course syllabus. In addition, they will also be listed in the following publicly visible Github Repo. You can send us changes to the course website by forking and sending a pull request to the course website github repository. You will then become part of the history of Data 100 at Berkeley. ", - "url": "/su23/resources/#course-website", + "url": "/fa23-testing/resources/#course-website", "relUrl": "/resources/#course-website" },"51": { "doc": "Resources", "title": "Coding and Mathematics Resources", "content": "Pandas . | DS100 Textbook Pandas Reference Table | Pandas API Reference | The Pandas Cookbook: This provides a nice overview of some of the basic Pandas functions. However, it is slightly out of date. | Learn Pandas A set of lessons providing an overview of the Pandas library. | Python for Data Science Another set of notebook demonstrating Pandas functionality. | . SQL . | We’ve assembled some SQL Review Slides to help you brush up on SQL. | We’ve also compiled a list of SQL practice problems, which can be found here, along with their solutions. | This SQL Cheat Sheet is an awesome resource that was created by Luke Harrison, a former Data 100 student. | . Regex . | Regex101.com. Remember to select the Python flavour of Regex! | DS100 Reference Sheet | We’ve organized some regular expressions(regex) problems to help you get extra practice on regex in a notebook format. They can be found here, along with their solutions. | The official Python3 regex guide is good: link | . LaTeX . | Quick Guide to Overleaf and LaTeX | . Other Web References . As a data scientist you will often need to search for information on various libraries and tools. In this class we will be using several key python libraries. Here are their documentation pages: . | Python: . | DS100 Textbook scikit-learn Reference Table | Python Tutorial: Teach yourself python. This is a pretty comprehensive tutorial. | Python + Numpy Tutorial this tutorial provides a great overview of a lot of the functionality we will be using in DS100. | Python 101: A notebook demonstrating a lot of python functionality with some (minimal explanation). | . | Data Visualization: . | DS100 Textbook Seaborn Reference Table and Matplotlib Reference Table | matplotlib.pyplot tutorial: This short tutorial provides an overview of the basic plotting utilities we will be using. | Pandas Tutor. | Kernel Density Visualization. | Altair Documentation: Altair(Vega-Lite) is a new and powerful visualization library. We might not get to teach it this semester, but you should check it out if you are interested in pursuing visualization deeper. In particular, you should find the example gallery helpful. | Prof. Jeff Heer’s Visualization Curriculum: This repository contains a series of Python-based Jupyter notebooks that teaches data visualization using Vega-Lite and Altair. | If you are interested in learning more about data visualization, you can find more materials in: . | Edward Tufte’s book sequences – a classic! | Prof. Heer’s class. | . | . | . Calculus and Linear Algebra . Note: None of these resources are meant to be a substitute for the appropriate requirement / co-requisite (Math 54, etc.). If you have no familiarity whatsoever with either of these topics, these may not be adequate and we strongly recommend spending time covering the prerequisite material yourself. We will assume that you have prior knowledge of these requirements and that these resources are simply to refresh your memory of concepts that you have previously learned. Please reach out to staff if you have any questions or concerns about this. Calculus: In terms of calculus, you will need to know a few things, most of which are covered within the space of the first homework and lab. Specifically, you will need to know univariate calculus rules like: Taking derivatives of a univariate function (i.e. f(x), where x is the only variable); Derivative power rule; Knowing derivatives of mathematical functions like: sinx,cosx,logx,ex; Chain rule; Product rule (rarely); Derivatives of sums. We will expect some multivariate fluency like: Taking partial derivatives of a multivariate function (i.e. f(x,y,z), where x,y,z are all variables); Gradients (the concept). | Khan Academy: Derivatives, Definitions, and Basic Rules; Multivariable Derivatives . | Math 53: Derivatives of Vector Functions . | . Linear Algebra: . Concepts roughly in order of importance: vectors, matrices; rank/nullity; inner products, orthogonality, norms; linear independence; orthonormal matrices; vector spaces; projections; invertibility. | EE16A notes/assignments: Vector and Matrix Operations (Note 2A, Note 2B); Span, Linear Dependence/Independence (Note 3); Linear Transformations (Note 5); Matrix Inversion (Note 6); Vector Subspaces (Note 6); Inner Products (Note 21); Least Squares (Note 23); | Math 54: Prof. Alex Paulin Video Lectures | Data 100 textbook: Geometric Perspective of Linear Projection (Chapter 15); Vector Spaces (Appendix 2) | 3blue1brown: Essence of Linear Algebra | Khan Academy: Linear Algebra | MIT OpenCourseware: Linear Algebra Video Lectures | . Probability . | We’ve compiled a few practice probability problems that we believe may help in understanding the ideas covered in the course. They can be found here, along with their solutions. | We’d also like to point you to the textbook for Data C88S, an introductory probability course geared towards data science students at Berkeley. | . ", - "url": "/su23/resources/#coding-and-mathematics-resources", + "url": "/fa23-testing/resources/#coding-and-mathematics-resources", "relUrl": "/resources/#coding-and-mathematics-resources" },"52": { "doc": "Resources", "title": "Books", "content": "Because data science is a relatively new and rapidly evolving discipline there is no single ideal textbook for this subject. Instead we plan to use reading from a collection of books all of which are free. However, we have listed a few optional books that will provide additional context for those who are interested. | Principles and Techniques of Data Science, the Data 100 textbook. | Introduction to Statistical Learning (Free online PDF) This book is a great reference for the machine learning and some of the statistics material in the class . | Data Science from Scratch (Available as eBook for Berkeley students) This more applied book covers many of the topics in this class using Python but doesn’t go into sufficient depth for some of the more mathematical material. | Doing Data Science (Available as eBook for Berkeley students) This books provides a unique case-study view of data science but uses R and not Python. | Python for Data Analysis (Available as eBook for Berkeley students). This book provides a good reference for the Pandas library. | . ", - "url": "/su23/resources/#books", + "url": "/fa23-testing/resources/#books", "relUrl": "/resources/#books" },"53": { "doc": "Resources", "title": "Wellness Resources", "content": "Your well-being matters, and we hope that Data 100 is never a barrier to taking care of your mental and physical health. Below are some campus resources that may be helpful. COVID-19 Resources and Support . You can find UC Berkeley’ COVID-19 resources and support here. For academic performance, support, and technology . The Center for Access to Engineering Excellence (Bechtel Engineering Center 227) is an inclusive center that offers study spaces, nutritious snacks, and tutoring in >50 courses for Berkeley engineers and other majors across campus. The Center also offers a wide range of professional development, leadership, and wellness programs, and loans iclickers, laptops, and professional attire for interviews. As the primary academic support service for undergraduates at UC Berkeley, the Student Learning Center (510-642-7332) assists students in transitioning to Cal, navigating the academic terrain, creating networks of resources, and achieving academic, personal, and professional goals. Through various services including tutoring, study groups, workshops, and courses, SLC supports undergraduate students in Biological and Physical Sciences, Business Administration, Computer Science, Economics, Mathematics, Social Sciences, Statistics, Study Strategies, and Writing. The Educational Opportunity Program (EOP, Cesar Chavez Student Center 119; 510-642-7224) at Cal has provided first generation and low income college students with the guidance and resources necessary to succeed at the best public university in the world. EOP’s individualized academic counseling, support services, and extensive campus referral network help students develop the unique gifts and talents they each bring to the university while empowering them to achieve. Students can access device lending options through the Student Technology Equity Program (STEP) program. For mental well-being . The staff of the UHS Counseling and Psychological Services (Tang Center, 2222 Bancroft Way; 510-642-9494; for after-hours support, please call the 24/7 line at 855-817-5667) provides confidential, brief counseling and crisis intervention to students with personal, academic and career stress. Services are provided by a multicultural group of professional counselors including psychologists, social workers, and advanced level trainees. All undergraduate and graduate students are eligible for CAPS services, regardless of insurance coverage. To improve access for engineering students, a licensed psychologist from the Tang Center also holds walk-in appointments for confidential counseling in Bechtel Engineering Center 241 (check here for schedule). For disability accommodations . The Disabled Students’ Program (DSP, 260 César Chávez Student Center #4250; 510-642-0518) serves students with disabilities of all kinds, including mobility impairments, blind or low vision, deaf or hard of hearing; chronic illnesses (chronic pain, repetitive strain injuries, brain injuries, AIDS/HIV, cancer, etc.) psychological disabilities (bipolar disorder, severe anxiety or depression, etc.), Attention Deficit Disorder/Attention Deficit Hyperactivity Disorder, and Learning Disabilities. Services are individually designed and based on the specific needs of each student as identified by DSP’s Specialists. The Program’s official website includes information on DSP staff, UCB’s disabilities policy, application procedures, campus access guides for most university buildings, and portals for students and faculty. For solving a dispute . The Ombudsperson for Students (Sproul Hall 102; 510-642-5754) provides a confidential service for students involved in a University-related problem (academic or administrative), acting as a neutral complaint resolver and not as an advocate for any of the parties involved in a dispute. The Ombudsperson can provide information on policies and procedures affecting students, facilitate students’ contact with services able to assist in resolving the problem, and assist students in complaints concerning improper application of University policies or procedures. All matters referred to this office are held in strict confidence. The only exceptions, at the sole discretion of the Ombudsperson, are cases where there appears to be imminent threat of serious harm. The Student Advocate’s Office (SAO) is an executive, non-partisan office of the ASUC. We offer free, confidential casework services and resources to any student(s) navigating issues with the University, including academic, conduct, financial aid, and grievance concerns. All support is centered around students and aims for an equity-based approach. For recovery from sexual harassment or sexual assault . The Care Line (510-643-2005) is a 24/7, confidential, free, campus-based resource for urgent support around sexual assault, sexual harassment, interpersonal violence, stalking, and invasion of sexual privacy. The Care Line will connect you with a confidential advocate for trauma-informed crisis support including time-sensitive information, securing urgent safety resources, and accompaniment to medical care or reporting. For social services . Social Services provides confidential services and counseling to help students with managing problems that can emerge from illness such as financial, academic, legal, family concerns, and more. They specialize in helping students with pregnancy resources and referrals; alcohol/drug problems related to one’s own or a family member’s use; sexual assault/rape; relationship or other violence; and support for health concerns-new diagnoses or ongoing conditions. Social Services staff will assess a student’s immediate needs, work with the student to develop a plan to meet those needs, and facilitate arrangements with academic departments and advocate for the student with other campus offices and community agencies, as well as coordinate services within UHS. For finding community on campus . The mission of the Berkeley International Office (2299 Piedmont Avenue, 510-642-2818) is to provide support with all the essential resources needed to not only survive, but thrive here at UC Berkeley. Their mission is to support you and work together towards justice and belonging for all. They define Basic Needs as the essential resources that impact your health, belonging, persistence, and overall well being. It is an ecosystem that includes: nutritious food, stable housing, hygiene, transportation, healthcare, mental wellness, financial sustainability, sleep, and emergency dependent services. They refuse to accept hunger, homelessness, and all other basic needs injustices as part of our university. The Gender Equity Resource Center, fondly referred to as GenEq, is a UC Berkeley campus community center committed to fostering an inclusive Cal experience for all. GenEq is the campus location where students, faculty, staff and Alumni connect for resources, services, education and leadership programs related to gender and sexuality. The programs and services of the Gender Equity Resource Center are focused into four key areas: women; lesbian, gay, bisexual, and transgender (LGBT); sexual and dating violence; and hate crimes and bias driven incidents. GenEq strives to provide a space for respectful dialogue about sexuality and gender; illuminate the interrelationship of sexism, homophobia and gender bias and violence; create a campus free of violence and hate; provide leadership opportunities; advocate on behalf of survivors of sexual, hate, dating and gender violence; foster a community of women and LGBT leaders; and be a portal to campus and community resources on LGBT, Women, and the many intersections of identity (e.g., race, class, ability, etc.). The Undocumented Students Program (119 Cesar Chavez Center; 642-7224) practices a holistic, multicultural and solution-focused approach that delivers individualized service for each student. The academic counseling, legal support, financial aid resources and extensive campus referral network provided by USP helps students develop the unique gifts and talents they each bring to the university, while empowering a sense of belonging. The program’s mission is to support the advancement of undocumented students within higher education and promote pathways for engaged scholarship. The Multicultural Education Program (MEP) is one of six initiatives funded by the Evelyn and Walter Haas, Jr. Fund to work towards institutional change and to create a positive campus climate for diversity. The MEP is a five-year initiative to establish a sustainable infrastructure for activities like educational consultation and diversity workshops for the campus that address both specific topics, and to cater to group needs across the campus. For basic needs (food, shelter, etc.) . The Basic Needs Center (lower level of MLK Student Union, Suite 72) provides support with all the essential resources needed to not only survive, but thrive here at UC Berkeley. Their mission is to support you and work together towards justice and belonging for all. They define Basic Needs as the essential resources that impact your health, belonging, persistence, and overall well being. It is an ecosystem that includes: nutritious food, stable housing, hygiene, transportation, healthcare, mental wellness, financial sustainability, sleep, and emergency dependent services. They refuse to accept hunger, homelessness, and all other basic needs injustices as part of our university. The UC Berkeley Food Pantry (#68 Martin Luther King Student Union) aims to reduce food insecurity among students and staff at UC Berkeley, especially the lack of nutritious food. Students and staff can visit the pantry as many times as they need and take as much as they need while being mindful that it is a shared resource. The pantry operates on a self-assessed need basis; there are no eligibility requirements. The pantry is not for students and staff who need supplemental snacking food, but rather, core food support. ", - "url": "/su23/resources/#wellness-resources", + "url": "/fa23-testing/resources/#wellness-resources", "relUrl": "/resources/#wellness-resources" },"54": { "doc": "Resources", "title": "Data Science Education", "content": "Interested in bringing the Data Science major or curriculum to your academic institution? Please fill out this form if you would like support from Berkeley in offering some variant of our Data Science courses at your institution (or just to let us know that you’re interested). Information about the courses appear at data8.org and ds100.org. Please note that this form is only for instructors. If you are only interested in learning Python or data science, please look at our Data 8 or Data 100 websites mentioned above. ", - "url": "/su23/resources/#data-science-education", + "url": "/fa23-testing/resources/#data-science-education", "relUrl": "/resources/#data-science-education" },"55": { "doc": "Resources", "title": "Local Setup (Old)", "content": "NOTE: This section is out of date and no longer supported by the course staff. Click here to read our guide on how to set up our development environment locally (as an alternative to using DataHub). Please note that any autograder tests will only work on DataHub. ", - "url": "/su23/resources/#local-setup-old", + "url": "/fa23-testing/resources/#local-setup-old", "relUrl": "/resources/#local-setup-old" },"56": { "doc": "Local Setup", "title": "Local Setup", "content": "We will still be using datahub as our primary computing environment. This page serves as a guide for alternative environment setup. In other words: you don’t have to follow these instructions unless you’d like an alternative to datahub. ", - "url": "/su23/setup/", + "url": "/fa23-testing/setup/", "relUrl": "/setup/" },"57": { "doc": "Local Setup", "title": "Contents", "content": ". | Installing conda by OS . | OSX | Windows | Linux | . | Creating your environment | Working on assignments locally | Opening notebooks locally | Verifying your environment | Removing the environment to start over | Submitting your work | FAQ | . ", - "url": "/su23/setup/#contents", + "url": "/fa23-testing/setup/#contents", "relUrl": "/setup/#contents" },"58": { "doc": "Local Setup", "title": "OSX", "content": ". | You will need access to the command line. On a Mac, you can open the Terminal by opening Spotlight (Cmd + Space) and typing \"Terminal\". Alternatively, you can go to your Applications screen and select Terminal (it might be in the folder named \"Other\") . | Homebrew is a package manager for OSX. If you haven’t already, install it by running the following in the command line (copy, paste, and enter): . # This downloads the Ruby code of the installation script and runs it /usr/bin/ruby -e \"$(curl -fsSL https://raw.githubusercontent.com/Homebrew/install/master/install)\" . Verify your installation by making sure brew --version doesn’t error at your terminal. | Download and install Anaconda: . # Uses curl to download the installation script curl https://repo.continuum.io/miniconda/Miniconda2-4.5.11-MacOSX-x86_64.sh > miniconda.sh # Run the miniconda installer (you will need to enter your password) bash miniconda.sh . | Close and restart your terminal. Ensure the installation worked by running conda --version. | . You may remove the miniconda.sh script now if you’d like. Click here to continue to the next part of the setup. ", - "url": "/su23/setup/#osx", + "url": "/fa23-testing/setup/#osx", "relUrl": "/setup/#osx" },"59": { "doc": "Local Setup", "title": "Windows", "content": "Windows is especially prone to error if you aren’t careful about your configuration. If you’ve already had Anaconda or git installed and can’t get the other to work, try uninstalling everything and starting from scratch. Installing Anaconda: . | Visit the Anaconda website and download the installer for Python 3.7. Download the 64-bit installer if your computer is 64-bit (most likely), the 32-bit installer if not. See this FAQ if you are unsure. | Run the exe file to install Anaconda. Leave all the options as default (install for all users, in the default location). Make sure both of these checkboxes are checked: . | . 1) Verify that the installation is working by starting the Anaconda Prompt (you should be able to start it from the Start Menu) and typing python: . Notice how the python prompt shows that it is running from Anaconda. Now you have conda installed! . From now on, when we talk about the “Terminal” or “Command Prompt”, we are referring to the Anaconda Prompt that you just installed. Click here to continue to the next part of the setup. ", - "url": "/su23/setup/#windows", + "url": "/fa23-testing/setup/#windows", "relUrl": "/setup/#windows" },"60": { "doc": "Local Setup", "title": "Linux", "content": "These instructions assume you have apt-get (Ubuntu and Debian). For other distributions of Linux, substitute the appropriate package manager. | Your terminal program allows you to type commands to control your computer. On Linux, you can open the Terminal by going to the Applications menu and clicking “Terminal”. | Install wget. This is a command-line tool that lets you download files / webpages at the command line. sudo apt-get install wget . | Download the Anaconda installation script: . wget -O install_anaconda.sh https://repo.continuum.io/miniconda/Miniconda2-4.5.11-Linux-x86_64.sh . | . 4) Install Anaconda: . bash install_anaconda.sh . 5) Close and restart your terminal. Ensure the installation worked by running `conda --version`. You may remove the install_anaconda.sh script now if you’d like. Click here to continue to the next part of the setup. ", - "url": "/su23/setup/#linux", + "url": "/fa23-testing/setup/#linux", "relUrl": "/setup/#linux" },"61": { "doc": "Local Setup", "title": "Creating your environment", "content": "These instructions are the same for OSX, Windows, and Linux. | Download the data100 data100_environment.yml] from the course repository here or: . # download via curl curl https://raw.githubusercontent.com/DS-100/su20/gh-pages/resources/assets/local_setup/data100_environment.yml > data100_environment.yml # OR download via wget wget -O data100_environment.yml https://raw.githubusercontent.com/DS-100/su20/gh-pages/resources/assets/local_setup/data100_environment.yml . | . This YAML file is what we use to specify the dependencies and packages (and their versions) we wish to install into the conda environment we will make for this class. The purpose of the environment is to ensure that everyone in the course is using the same package versions for every assignment whether or not they are working on datahub. This is to prevent inconsistent behavior due to differences in package versions. | Using the Terminal, navigate to the directory where you downloaded data100_environment.yml. Run these commands to create a new conda environment. Each conda environment maintains its own package versions, allowing us to switch between package versions easily. For example, this class uses Python 3, but you might have another that uses Python 2. With a conda environment, you can switch between those at will. # sanity check on conda installation. Should be 4.5 or higher conda --version # update conda just in case it's out of date # enter y if prompted to proceed conda update conda # download git conda install -c anaconda git # Create a python 3.6 conda environment with the full set # of packages specified in environment.yml (jupyter, numpy, pandas, ...) conda env create -f data100_environment.yml # Switch to the data100 environment conda activate data100 # Check if packages are in the environment # This should not be empty! conda list . | . From now on, you can switch to the data100 env with conda activate data100, and switch back to the default env with conda deactivate. ", - "url": "/su23/setup/#creating-your-environment", + "url": "/fa23-testing/setup/#creating-your-environment", "relUrl": "/setup/#creating-your-environment" },"62": { "doc": "Local Setup", "title": "Working on assignments locally", "content": "These instructions are the same for OSX, Windows, and Linux. To work on assignments, you should fetch the assignment on datahub, navigate to the assignment folder and click on the download icon on the top right: . Then you can unzip the files into a folder of your choosing. Remember the location of your assignment files because you’ll need to navigate to that folder to open the notebook. ", - "url": "/su23/setup/#working-on-assignments-locally", + "url": "/fa23-testing/setup/#working-on-assignments-locally", "relUrl": "/setup/#working-on-assignments-locally" },"63": { "doc": "Local Setup", "title": "Opening notebooks locally", "content": "To open Jupyter notebooks, you’ll navigate to parent directory of the assignment in your terminal, activate the environment, and start up a jupyter server. This will look something like: . cd path/to/assignment/directory conda activate data100 jupyter notebook . This will automatically open the notebook interface in your browser. You can then browse to a notebook and open it. Make sure to always work in the data100 conda environment when you are using jupyter notebooks for this class. This ensures you have all the necessary packages required for the notebook to run. ", - "url": "/su23/setup/#opening-notebooks-locally", + "url": "/fa23-testing/setup/#opening-notebooks-locally", "relUrl": "/setup/#opening-notebooks-locally" },"64": { "doc": "Local Setup", "title": "Verifying Your Environment", "content": "You can tell if you are correct environment if your terminal looks something like: . Additionally, . conda env list . outputs a list of all your conda environments, and data100 should appear with a * next to it (the active one). ", - "url": "/su23/setup/#verifying-your-environment", + "url": "/fa23-testing/setup/#verifying-your-environment", "relUrl": "/setup/#verifying-your-environment" },"65": { "doc": "Local Setup", "title": "Removing the environment to start over", "content": "If you feel as if you’ve messed up and need to start over, you can remove the environment with . conda remove --name data100 --all . To verify that the environment was removed, in your Terminal window or an Anaconda Prompt, run: . conda info --envs . Which should then no longer display the data100 environment. ", - "url": "/su23/setup/#removing-the-environment-to-start-over", + "url": "/fa23-testing/setup/#removing-the-environment-to-start-over", "relUrl": "/setup/#removing-the-environment-to-start-over" },"66": { "doc": "Local Setup", "title": "Submitting your work", "content": "Submissions will still be handled via datahub. To upload your work, navigate to the appropriate assignment folder on datahub and click on the upload button on the top right. Remember to validate, submit, and upload to Gradescope (for homeworks and projects). ", - "url": "/su23/setup/#submitting-your-work", + "url": "/fa23-testing/setup/#submitting-your-work", "relUrl": "/setup/#submitting-your-work" },"67": { "doc": "Local Setup", "title": "FAQ", "content": "Shell not properly configured to use conda activate . If you had an older version of Anaconda installed (perhaps for another class), you may see the following message. Follow the instructions in the prompt to: . | Enable conda for all users sudo ln -s ... | Put the base environment on PATH echo \"conda activate\" >> ~/.bash_profile\". Note that ~/.bash_profile may be something different like ~/.bashrc. | Manually remove the line that looks like export PATH=\"/usr/local/miniconda3/bin:$PATH\" from your .bash_profile. Use your favorite plaintext editor to do this (do not use a rich text editor like Microsoft Word!). | . ", - "url": "/su23/setup/#faq", + "url": "/fa23-testing/setup/#faq", "relUrl": "/setup/#faq" },"68": { "doc": "Staff", "title": "Staff", "content": "Jump to: Instructors, Teaching Assistants, Readers. Note: Consult the calendar for the most up-to-date office hours for each GSI. All GSI Office Hours will be held in Warren 101B. ", - "url": "/su23/staff/", + "url": "/fa23-testing/staff/", "relUrl": "/staff/" },"69": { "doc": "Staff", "title": "Course Staff Email", "content": "Contact course staff via Ed with any questions or concerns. For sensitive matters, the staff email address data100.instructors@berkeley.edu is monitored by the instructors and a few lead TAs. ", - "url": "/su23/staff/#course-staff-email", + "url": "/fa23-testing/staff/#course-staff-email", "relUrl": "/staff/#course-staff-email" },"70": { "doc": "Staff", "title": "Instructors", - "content": "Bella Crouch She/Her/Hers . isabella.crouch@berkeley.edu . Office Hours: Tue, Th 3-4pm (Warren 111) . Dominic Liu He/Him/His . hangxingliu@berkeley.edu . Office Hours: Mon, Wed 3-4pm (Warren 111) . ", - "url": "/su23/staff/#instructors", + "content": "Fernando Pérez He/Him/His . fernando.perez@berkeley.edu . Narges Norouzi She/Her/Hers . norouzi@berkeley.edu . ", + "url": "/fa23-testing/staff/#instructors", "relUrl": "/staff/#instructors" },"71": { "doc": "Staff", "title": "Teaching Assistants", "content": "Alan Jian He/Him/His . alanjian131@berkeley.edu . Office Hours: Mon, Wed 1-3 . Hi there, my name is Alan and I’m a 5th year MIDS student with a background in natural language processing and an interest in data engineering and data ethics. When I’m not doing data things, you’ll either find me playing tennis at the Hearst courts or curled up at home with a good book :) . Bennett Somerville He/Him/His . bdsomer@berkeley.edu . Office Hours: Mon, Tue 1-3 . I’m a rising third-year undergraduate student majoring in computer science. I enjoy writing code, teaching, cycling, repairing bikes, playing music, and learning languages, among other things. Feel free to reach out! . Celine Choi She/Her/Hers . celinejwchoi@berkeley.edu . Office Hours: Mon, Wed 1-3 . Hey everyone! I am a rising junior studying CS. This is my second year on course staff and I’m super stoked to meet you all :) . Mihran Miroyan He/Him/His . miroyan.mihran@berkeley.edu . Office Hours: Mon, Thu 3-5 . Hey, I am Mir! . Milad Shafaie He/Him/His . mshafaie@berkeley.edu . Office Hours: Tue 4-5, Wed 3-5, Thu 1-2 . Hello . Nathan Harounian He/Him/His . nathanharounian@berkeley.edu . Office Hours: Fri 12-4 . Hey! I’m a senior studying Statistics and Data Science. In my free time, I enjoy hanging out with my friends, listening to music, archery, and poker! I really enjoyed taking Data 100 last summer and look forward to helping y’all this summer :) . Stephanie Xu She/Her/Hers . stephanie.xu@berkeley.edu . Office Hours: Mon 11-1, Tue 12-1, Wed 12-1 . Hi! I’m a CS and Data Science double major and I’m super excited to be one of your uGSIs! Feel free to reach out to me if you have any questions regarding the course or simply want someone to talk to! . Tina Chen She/Her/Hers . czz129@berkeley.edu . Office Hours: Thu, Fri 1-3 . Hi Everyone! I’am Tina a rising senior majoring DS + stats. I’m super exicting to meet with everyone. Feel free to reach out to me for any questions! :))) . Yash Dave He/Him/His . yashdave003@berkeley.edu . Office Hours: Mon 12-1, Tue 12-2, Wed 12-1 . Hi! I’m Yash, a rising junior majoring in Applied Math and CS with a minor in Public Policy. Excited to be teaching Data 100 over the summer!! . Yuerou Tang They/Them/Theirs . yuerou.tang@berkeley.edu . Hi! I’m a senior studying CS and Conservation & Resource Studies. Check out my website for cool bird pictures I took!! . Zaid Maayah He/Him/His . zaidmaayah@berkeley.edu . Office Hours: Tue, Thu 2-4 . Hi everyone! I’m a rising fourth-year international student from Jordan, double majoring in Data science and Linguistics. I like traveling, compiling playlists, and rating every restaurant in Berkeley. I hope you enjoy the course! . ", - "url": "/su23/staff/#teaching-assistants", + "url": "/fa23-testing/staff/#teaching-assistants", "relUrl": "/staff/#teaching-assistants" },"72": { "doc": "Staff", "title": "Readers", "content": "Aneesh Durai He/Him/His . aneesh.durai@berkeley.edu . Hi! I’m Aneesh, and I’m very excited to be working with you this summer! . Anthony Zhang He/Him/His . anthony_zhang1234@berkeley.edu . yooo it’s anthony - im an expert in bonking on my bike, entering food coma, and tripping myself in dance dance revolution. i like to study quik mafs and cs . Archer Parry He/Him/His . archerp@berkeley.edu . Hi, I am a rising senior that enjoys hanging out with friends and playing games in my free time. Asbah Wasim She/Her/Hers . asbahwasim@berkeley.edu . Hi there, welcome to Data 100! I am a rising junior studying Cognitive Science and Data Science. In my free time, I enjoy drawing nature, painting scenery, organizing, and going on walks. I look forward to meeting you over the summer, and hope you have a great time in the class! . Hans Mao He/Him/His . huanzhimao@berkeley.edu . Hello! I’m a rising junior majoring in CS and Stat. I’m interested in computer security, distributed systems, and machine learning. I <3 Data 100! Besides teaching, I enjoy sailing, hiking, and swimming. Looking forward to an awesome semester :o (Generated by ChatGPT) . Matthew Lee He/Him/His . matthewlee3@berkeley.edu . hey i’m matthew and i like great vibes. please hit me up if you have a life changing restaurant. Yehchan Yoo He/Him/His . yehchanyoo@berkeley.edu . Hello — I am a senior majoring in Statistics and Political Economy & minoring in Data Science; I like to read the news, watch YouTube videos, listen to rock and electronic music, mediate, lift weights, and do boxing in my free time. Hope you all will enjoy the course, and always feel free to reach out! . ", - "url": "/su23/staff/#readers", + "url": "/fa23-testing/staff/#readers", "relUrl": "/staff/#readers" },"73": { "doc": "Syllabus", "title": "Syllabus", "content": "Jump to: . | About Data 100 . | Goals | Prerequisites | . | Course Culture . | Be Aware of Your Actions | Be Respectful | Communicate Issues with Course Staff and/or the Department | . | Course Delivery | Course Components . | Lecture | Discussion | Homework and Projects | Lab | Exams | . | Office Hours and Communication | Policies . | Grading Scheme | On-Time Submission | Grace Period | Extenuating Circumstances | DSP Accommodations | Regrade Requests | Collaboration Policy and Academic Honesty | . | Academic and Wellness Resources | We want you to succeed! | Acknowledgments | . ", - "url": "/su23/syllabus/", + "url": "/fa23-testing/syllabus/", "relUrl": "/syllabus/" },"74": { "doc": "Syllabus", "title": "About Data 100", "content": "Combining data, computation, and inferential thinking, data science is redefining how people and organizations solve challenging problems and understand their world. This intermediate level class bridges between Data 8 and upper division computer science and statistics courses as well as methods courses in other fields. In this class, we explore key areas of data science including question formulation, data collection and cleaning, visualization, statistical inference, predictive modeling, and decision making.​ Through a strong emphasis on data centric computing, quantitative critical thinking, and exploratory data analysis, this class covers key principles and techniques of data science. These include languages for transforming, querying and analyzing data; algorithms for machine learning methods including regression, classification and clustering; principles behind creating informative data visualizations; statistical concepts of measurement error and prediction; and techniques for scalable data processing. Goals . | Prepare students for advanced Berkeley courses in data-management, machine learning, and statistics, by providing the necessary foundation and context. | Enable students to start careers as data scientists by providing experience working with real-world data, tools, and techniques. | Empower students to apply computational and inferential thinking to address real-world problems. | . Prerequisites . While we are working to make this class widely accessible, we currently require the following (or equivalent) prerequisites. Prerequisites will be enforced in Data 100. It is your responsibility to know the material in the prerequisites. The instructors do not have the authority to waive these requirements. Undergraduates should fill out the Enrollment Exception Form managed by CDSS to request an exception. | Foundations of Data Science: Data 8 covers much of the material in Data 100 but at an introductory level. Data 8 provides basic exposure to python programming and working with tabular data as well as visualization, statistics, and machine learning. | Computing: The Structure and Interpretation of Computer Programs (CS 61A) or Computational Structures in Data Science (Data 88C). These courses provide additional background in python programming (e.g., for loops, lambdas, debugging, and complexity) that will enable Data 100 to focus more on the concepts in Data Science and less on the details of programming in python. | Math: Linear Algebra (Math 54, EECS 16A, Math 91, Math 110, or Stat 89A). We will need some basic concepts like linear operators, eigenvectors, derivatives, and integrals to enable statistical inference and derive new prediction algorithms. This may be satisfied concurrently to Data 100. | . Please consult the Resources page for additional resources for reviewing prerequisite material. Textbook: There is no official textbook for Data 100 this semester; we will provide course notes that will be released with the respective lectures. ", - "url": "/su23/syllabus/#about-data-100", + "url": "/fa23-testing/syllabus/#about-data-100", "relUrl": "/syllabus/#about-data-100" },"75": { "doc": "Syllabus", "title": "Course Culture", "content": "Students taking Data C100 come from a wide range of backgrounds. We hope to foster an inclusive and safe learning environment based on curiosity rather than competition. All members of the course community — the instructors, students, and course staff — are expected to treat each other with courtesy and respect. Some of the responsibility for that lies with the staff, but a lot of it ultimately rests with you, the students. Be Aware of Your Actions . Sometimes, the little things add up to creating an unwelcoming culture to some students. For example, you and a friend may think you are sharing in a private joke about other races, majors, genders, abilities, cultures, etc. but this can have adverse effects on classmates who overhear it. There is a great deal of research on something called “stereotype threat”: research finds that simply reminding someone that they belong to a particular culture or share a particular identity (on whatever dimension) can interfere with their course performance. Stereotype threat works both ways: you can assume that a student will struggle based on who they appear to be, or you can assume that a student is doing great based on who they appear to be. Both are potentially harmful. Bear in mind that diversity has many facets, some of which are not visible. Your classmates may have medical conditions (physical or mental), personal situations (financial, family, etc.), or interests that aren’t common to most students in the course. Another aspect of professionalism is avoiding comments that (likely unintentionally) put down colleagues for situations they cannot control. Bragging in open space that an assignment is easy or “crazy,” for example, can send subtle cues that discourage classmates who are dealing with issues that you can’t see. Please take care, so we can create a class in which all students feel supported and respected. Be Respectful . Beyond the slips that many of us make unintentionally are a host of behaviors that the course staff, department, and university do not tolerate. These are generally classified under the term harassment; sexual harassment is a specific form that is governed by federal laws known as Title IX. UC Berkeley’s Title IX website provides many resources for understanding the terms, procedures, and policies around harassment. Make sure you are aware enough of these issues to avoid crossing a line in your interactions with other students. For example, repeatedly asking another student out on a date after they have said no can cross this line. Your reaction to this topic might be to laugh it off, or to make or think snide remarks about “political correctness” or jokes about consent or other things. You might think people just need to grow a thicker skin or learn to take a joke. This isn’t your decision to make. Research shows the consequences (emotional as well as physical) on people who experience harassment. When your behavior forces another student to focus on something other than their education, you have crossed a line. You have no right to take someone else’s education away from them. Communicate Issues with Course Staff and/or the Department . We take all complaints about unprofessional or discriminatory behavior seriously. Professionalism and respect for diversity are not just matters between students; they also apply to how the course staff treat the students. The staff of this course will treat you in a way that respects our differences. However, despite our best efforts, we might slip up, hopefully inadvertently. If you are concerned about classroom environment issues created by the staff or overall class dynamic, please feel free to talk to us about it. The instructors in particular welcome any comments or concerns regarding conduct of the course and the staff. See below for how to best reach us. From the Data Science Department: Data Science Undergraduate Studies faculty and staff are committed to creating a community where every person feels respected, included, and supported. We recognize that incidents may happen, sometimes unintentionally, that run counter to this goal. There are many things we can do to try to improve the climate for students, but we need to understand where the challenges lie. If you experience a remark, or disrespectful treatment, or if you feel you are being ignored, excluded or marginalized in a course or program-related activity, please speak up. Consider talking to your instructor, but you are also welcome to contact Executive Director Christina Teller at cpteller@berkeley.edu or report an incident anonymously through this online form. As course staff, we are committed to creating a learning environment welcoming of all students that supports a diversity of thoughts, perspectives and experiences and respects your identities and backgrounds (including race, ethnicity, nationality, gender identity, socioeconomic class, sexual orientation, language, religion, ability, and more.) To help accomplish this: . | If your name and/or pronouns differ from those that appear in your official records, please let us know. | If you feel like your performance in the class is being affected by your experiences outside of class (e.g., family matters, current events), please don’t hesitate to come and talk with us. We want to be resources for you. | We (like many people) are still in the process of learning about diverse perspectives and identities. If something was said in class (by anyone) that made you feel uncomfortable, please talk to us about it. | While the course staff understands that improving diversity, equity, and inclusion (DEI) are not enough to overcome systemic issues in academia such as racism, queerphobia, and other forms of discrimination and hatred, we also recognize the importance of DEI work. | The Data Science Department has some resources available at https://data.berkeley.edu/about/diversity-equity-and-inclusion. | There’s also a great set of resources available at https://eecs.berkeley.edu/resources/students/grievances. | . | If there are other resources you think we should list here, let us know! | . ", - "url": "/su23/syllabus/#course-culture", + "url": "/fa23-testing/syllabus/#course-culture", "relUrl": "/syllabus/#course-culture" },"76": { "doc": "Syllabus", "title": "Course Delivery", "content": "In keeping with departmental guidelines set by the Division of Computing, Data Science, and Society, all Data Science courses at Berkeley are offered fully in-person in Summer 2023. This summer’s offering of Data 100 will be taught solely in-person. If you are unable to attend in-person discussion sections and office hours this summer, you are strongly encouraged to consider taking a different course. If you are unable to attend the in-person Midterm and Final, you cannot take Data 100 in Summer 2023. ", - "url": "/su23/syllabus/#course-delivery", + "url": "/fa23-testing/syllabus/#course-delivery", "relUrl": "/syllabus/#course-delivery" },"77": { "doc": "Syllabus", "title": "Course Components", "content": "Below is a high-level “typical week in the course” for Summer 2023. | Mo | Tu | We | Th | Fr | Sat | . | Office Hours | Office Hours | Office Hours | Office Hours | Office Hours |   | . | Live Lecture | Live Lecture | Live Lecture | Live Lecture |   |   | . | Discussion Section |   | Discussion Section |   | Exam Prep/Catch-Up |   | . | Homework due |   |   | Homework due |   |   | . |   |   |   |   |   | 2 Labs due | . | All deadlines are subject to change. | Office Hours are scheduled on the Calendar page. | Lectures, discussions, assignments, projects, and exams are scheduled on the Home page. | . Lecture . There are 4 live lectures held Mondays to Thursdays, 5:00 pm - 6:30 pm, in-person in Li Ka Shing 245. All lecture recordings, slides, activities, and examples will be provided to the course website within 24 hours of the lecture. Discussion . Live discussion sections are one hour long sessions held twice weekly on Mondays and Wednesdays. The goal of these GSI-led sessions is to work through problems, hone your skills, and flesh out your understanding as part of a team. The problems that you solve and present as part of discussion are important in understanding course material. The lectures, assignments, and exams of this course are structured with the expectation that all students attend discussion. The content covered in these sections is designed to solidify understanding of key lecture concepts and prepare students for homework assignments. It is to your benefit to actively participate in all discussions! . | Discussion attendance will be recorded each week and account for 5% of the overall grade | All students are automatically granted 3 discussion drops to use for illness, personal emergencies, or other extenuating circumstances. These drops are designed to account for unexpected events – you should not plan to use them! | Attending the exam-prep session on Friday can replace either a missed Monday or a missed Wednesday section only for that specific week. Details about exam-prep sections will be released in the second week of classes. | Students with low discussion attendance scores may alternatively shift this 5% of the course grade onto their homework score. Course staff will automatically determine which grading policy will maximize your final grade in the course at the end of the semester. | . You will be invited to share your timing preferences for discussions and assigned to a section in the first week of classes. Homework and Projects . Homeworks are half-week-long assignments designed to help students develop an in-depth understanding of both the theoretical and practical aspects of ideas presented in lecture. Projects are week-long assignments (with a half-week checkpoint) that synthesize multiple topics. Typically, assignments will be due at 11:59 pm on Mondays and Thursdays. | All homeworks and projects must be submitted to Gradescope by their posted deadlines. | Each assignment will include detailed instructions on how to submit your work for grading. It is the student’s responsibility to read these carefully and ensure that their work is submitted correctly. Assignment accommodations will not be granted in cases where students have mis-submitted their work (for example, by submitting to the wrong portal, submitting only part of an assignment, forgetting to select pages, or failing to pass autograder tests) | . | Homeworks and projects have both visible and hidden autograder tests. The visible tests are mainly sanity checks. For example, a sanity check might verify that the answer you entered is a number as expected, and not a word. The hidden tests generally check for correctness, and are invisible to students while they are doing the assignment. | The primary form of support students will have for homeworks and projects are office hours and Ed. | Homeworks and projects must be completed individually. See the Collaboration Policy for more details. | See the Policies section for the submission grace period. | . Lab . Labs are shorter programming assignments designed to give students familiarity with new ideas. They are meant to be completed prior to homework. Two lab assignments will be released at the start of each week, covering content that will be presented in that week’s lectures. The first of these two assignments will cover the content presented in Monday’s and Tuesday’s lectures; the second will cover the content presented in Wednesday’s and Thursday’s lectures. Both weekly lab assignments are due at 11:59 pm on the Saturday of the corresponding week. | All lab assignments must be submitted to Gradescope by their posted deadlines. | All lab autograder tests are visible. Receiving full points on the autograder guarantees that you will be awarded full points on the lab assignment. | All lab assignments will be accompanied by a video walkthrough with explanations of key concepts. There will be no synchronous lab sections, however, students are welcome to bring questions about lab to office hours. | All labs are intended to take about an hour. | . Exams . There will be two exams in this course: . | Midterm on Thursday, July 20 5-7 PM. | Final on Thursday, August 10 5-7 PM. | . All exams must be taken in-person. There will be one alternate final exam on August 10 6:30-8:30PM. ", - "url": "/su23/syllabus/#course-components", + "url": "/fa23-testing/syllabus/#course-components", "relUrl": "/syllabus/#course-components" },"78": { "doc": "Syllabus", "title": "Office Hours and Communication", "content": "We want to enable everyone to succeed in this course. We encourage you to discuss course content with your friends, classmates, and course staff throughout the semester, particularly during office hours. | All office hours are listed on the Calendar. | GSI office hours will be held in Warren Hall 101B. | In general, students can come to GSI office hours for any questions on course assignments or material. | Instructor office hours are generally reserved for conceptual questions, course review, or course logistics. | . Course Communication: . | EdStem, or Ed for short, is our course forum this semester. The course is here. All course announcements will be through Ed. We are not using bCourses this semester. Please check out Ed or the FAQ page first before emailing course staff directly. | Ed is a formal, academic space. We must demonstrate appropriate respect, consideration, and compassion for others. Please be friendly and thoughtful; our community draws from a wide spectrum of valuable experiences. For further reading, please reference Berkeley’s Principles of Community and the Berkeley Campus Code of Student Conduct. | . | . Ed is your primary platform for asking questions about the class. It is monitored daily by the entire course staff, so questions posted to Ed will likely receive the fastest response. If you need to discuss a more sensitive matter, the following emails are monitored by a smaller subset of the teaching team: . | For logistical questions: our course staff email is data100.instructors@berkeley.edu. | For extenuating circumstances/DSP: student accommodation requests will be handled via the Extenuating Circumstances Form. Our staff email for student support and DSP accommodations is data100.support@berkeley.edu. | Please only contact the course instructors directly for matters that require strict privacy and their personal attention. | . | . ", - "url": "/su23/syllabus/#office-hours-and-communication", + "url": "/fa23-testing/syllabus/#office-hours-and-communication", "relUrl": "/syllabus/#office-hours-and-communication" },"79": { "doc": "Syllabus", "title": "Policies", "content": "Grading Scheme . | Category | Percentage | Details | . | Homeworks | 25% | Drop lowest | . | Projects | 15% | No drop | . | Labs | 10% | Drop 2 lowest scores | . | Discussion | 5% | Drop 3 lowest scores | . | Midterm Exam | 15% |   | . | Final Exam | 30% |   | . Discussion attendance is expected for the summer session. Students with low discussion attendance scores may alternatively shift this 5% of the course grade onto their homework score, such that homework is worth 30% of the overall grade. Course staff will automatically apply whichever grading policy will maximize your final grade in the course at the end of the semester. On-Time Submission . All assignments are due at 11:59 PM Pacific Time on the due date specified on the Home / Schedule page. The date and time of this deadline are firm. Submitting even a minute past is considered late. Submitting by this “on-time” deadline earns an extra-credit on-time bonus, a 3% perk. This is available for homeworks, projects, and labs. Grace Period . We recognize that life can be unexpected, and that you may face circumstances that prevent you from submitting your work by the posted deadline. In light of this, we offer a 1-day (24 hour) grace period for late submissions of homeworks, projects, and labs. Note that this grace period is designed to account for unexpected emergencies or assignment submission errors – you should not plan in advance to use it! . You can make a late submission after the on-time deadline and up to the end of the grace period. These late submissions are not penalized, but do not earn 3% the on-time bonus. You do not need to explicitly contact staff about late submissions; just submit directly to Gradescope within the listed grace period. Submissions are not accepted beyond the grace period. The grace period is strictly enforced. We recommend thinking of the grace period as a backup, in case something unexpected comes up when aiming for the on-time deadline. As a result, getting an extension beyond the grace period will generally not be granted, except in rare, extraordinary emergencies (see the Extenuating Circumstances section). All official communication will refer to the on-time deadline as the expected dates that you will submit assignments. Extenuating Circumstances . We recognize that our students come from varied backgrounds and have widely-varying experiences. If you encounter extenuating circumstances at any time in the semester, please do not hesitate to let us know. The sooner we are made aware, the more options we have available to us to help you. The Extenuating Circumstances Form is for any circumstances that cannot be resolved via the grace period policy above. Within two business days of filling out the form, a course staff will reach out to you and provide a space for conversation, as well as to arrange course/grading accommodations as necessary. For more information, please email data100.support@berkeley.edu. We recognize that at times, it can be difficult to manage your course performance — particularly in such a huge course, and particularly at Berkeley’s high standards. Sometimes emergencies just come up (personal health emergency, family emergency, etc.). Our Grace Period Policy combined with the Extenuating Circumstances Form is meant to lower the barrier to reaching out to us, as well as build your independence in managing your academic career long-term. So please do not hesitate to reach out. Note that extenuating circumstances do not extend to logistical oversight, such as Datahub/Gradescope tests not passing, submitting only one portion of the homework, forgetting to save your notebook before exporting, submitting to the wrong assignment portal, or not properly tagging pages on Gradescope. It is the student’s responsibility to identify and resolve these issues in advance of the on-time deadline. We will not grant accommodations for these cases; instead, please use the grace period to cushion these submission errors. DSP Accommodations . If you are registered with the Disabled Students’ Program (DSP) you can expect to receive an email from us during the first week of classes confirming your accommodations. Otherwise, email our support email. DSP students who receive approved assignment accommodations will have the 1-day grace period added to the approved extension to the on-time deadline. Please note that any extension, plus the grace period combined, cannot exceed 5 days. DSP students can submit assignment extension accommodation requests via the Extenuating Circumstances Form. You are responsible for reasonable communication with course staff. If you make a request close to the deadline, we can not guarantee that you will receive a response before the deadline. Additionally, simply submitting a request does not guarantee you will receive an extension. Even if your work is incomplete, please submit before the deadline so you can receive credit for the work you did complete. Regrade Requests . Students will be allowed to submit regrade requests for the autograded and written portions of assignments in cases in which the rubric was incorrectly applied or the autograder scored their submission incorrectly. Regrades for the written portions of assignments will be handled through Gradescope, and autograder regrades via a Google Form. The deadline for regrade requests (autograded and written) is one week after the grades are released for the corresponding assignment. Always check that the autograder executes correctly! Gradescope will show you the output of the public tests, and you should see the same results as you did on DataHub. If you see a discrepancy, ensure that you have exported the assignment correctly and, if there is still an issue, post on Ed as soon as possible. Regrade requests will not be considered in cases in which: . | a student uploads the incorrect file to the autograder. | the autograder fails to execute and the student does not notify the course staff before the assignment deadline. | a student fails to save their notebook before exporting and uploads an old version to the autograder. | a situation arises in which the course staff cannot ensure that the student’s work was done before the assignment deadline. | . Collaboration Policy and Academic Honesty . We will be following the EECS departmental policy on Academic Honesty, which states that using work or resources that are not your own or not permitted by the course may lead to disciplinary actions, including a failing grade in the course. Assignments. Data science is a collaborative activity. While you may talk with others about the homework and projects, we ask that you write your solutions individually in your own words. If you do discuss the assignments with others please include their names at the top of your notebook. Restated, you and your friends are encouraged to discuss course content and approaches to problem-solving, but you are not allowed to share your code nor answers with other students, nor are you allowed to post your assignment solutions publicly. Doing so is considered academic misconduct. We will be running advanced plagiarism detection programs on all assignments. Use of AI-assisted methods, such as ChatGPT, to generate written or code solutions to assignments is prohibited. Exams. Cheating on exams is a serious offense. We have methods of detecting cheating on exams – so don’t do it! Students caught cheating on any exam will fail this course. Plagiarism on any assignment, as well as other violations to Berkeley’s Code of Conduct, will be reported to the Center for Student Conduct. The CSC treats most first-time offenses as a Non-Reportable Warning. Additionally we reserve the right to give you a negative full score (-100%) or lower on the assignments in question, an F in the course, or even dismissal from the university. It’s just not worth it! . Rather than copying someone else’s work, ask for help. You are not alone in Data 100! The entire staff is here to help you succeed. We expect that you will work with integrity and with respect for other members of the class, just as the course staff will work with integrity and with respect for you. Finally, know that it’s normal to struggle. Berkeley has high standards, which is one of the reasons its degrees are valued. Everyone struggles, even though many try not to show it. Even if you don’t learn everything that’s being covered, you’ll be able to build on what you do learn, whereas if you cheat you’ll have nothing to build on. You aren’t expected to be perfect; it’s ok not to get an A. ", - "url": "/su23/syllabus/#policies", + "url": "/fa23-testing/syllabus/#policies", "relUrl": "/syllabus/#policies" },"80": { "doc": "Syllabus", "title": "Academic and Wellness Resources", "content": "Our Resources page lists not only course-specific academic resources such as course notes, past exams, study guides, and prerequisite review links, but also campus wellness resources on COVID-19, academic support, technology support, mental well-being, DSP accommodations, dispute resolution, social services, campus community, and basic needs. Our staff will also refer to this page when supporting you through this course. ", - "url": "/su23/syllabus/#academic-and-wellness-resources", + "url": "/fa23-testing/syllabus/#academic-and-wellness-resources", "relUrl": "/syllabus/#academic-and-wellness-resources" },"81": { "doc": "Syllabus", "title": "We want you to succeed!", "content": "If you are feeling overwhelmed, visit our office hours and talk with us, or fill out the Extenuating Circumstances Form. We know college can be stressful and we want to help you succeed. Important Note: We are committed to being a resource to you, but it is important to note that all members of the teaching staff for this course are responsible employees, meaning that we must disclose any incidents of sexual harassment or violence to campus authorities. If you would like to speak to a confidential advocate, please consider reaching out to the Berkeley PATH to Care Center. Finally, the main goal of this course is that you should learn, and have a fantastic experience doing so. Please keep that goal in mind throughout the semester. Welcome to Data 100! . ", - "url": "/su23/syllabus/#we-want-you-to-succeed", + "url": "/fa23-testing/syllabus/#we-want-you-to-succeed", "relUrl": "/syllabus/#we-want-you-to-succeed" },"82": { "doc": "Syllabus", "title": "Acknowledgments", "content": "Academic Honesty policy and closing words adapted from Data 8. Course Culture inspired and adapted with permission from Dr. Sarah Chasins’ Fall 2021 CS 164 Syllabus and Grace O’Connell, the Asssociate Dean for Inclusive Excellence. ", - "url": "/su23/syllabus/#acknowledgments", + "url": "/fa23-testing/syllabus/#acknowledgments", "relUrl": "/syllabus/#acknowledgments" } diff --git a/_site/calendar/index.html b/_site/calendar/index.html index dbfe55a..ca701d2 100644 --- a/_site/calendar/index.html +++ b/_site/calendar/index.html @@ -1 +1 @@ - Calendar | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Calendar

Note: If you are having trouble viewing the calendars below and are using Safari, we suggest switching to an alternate browser (like Chrome). Alternatively, you can go to Safari settings and switch “Prevent cross-site tracking” off, or you can see the first calendar here and the second calendar here.

Office Hours Calendar

In-person office hours are in blue, click on each event to see which GSI and/or reader is running each office hour time. You should come to these with questions about anything – labs, homeworks, discussions, concepts, etc.

Note: All office hours will be held in-person in Warren Hall 101B.

Instructor office hours with Bella and Dominic appear in red. You should come to these with questions about concepts.


Lecture, Discussion, and Special Events Calendar

This calendar contains times for

  • live lectures (in brown)
  • live discussion sections (in orange)
  • live exam prep and other reviews (in green)
+ Calendar | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Calendar

Note: If you are having trouble viewing the calendars below and are using Safari, we suggest switching to an alternate browser (like Chrome). Alternatively, you can go to Safari settings and switch “Prevent cross-site tracking” off, or you can see the first calendar here and the second calendar here.

Office Hours Calendar

In-person office hours are in blue, click on each event to see which GSI and/or reader is running each office hour time. You should come to these with questions about anything – labs, homeworks, discussions, concepts, etc.

Note: All office hours will be held in-person in Warren Hall 101B.

Instructor office hours with Bella and Dominic appear in red. You should come to these with questions about concepts.


Lecture, Discussion, and Special Events Calendar

This calendar contains times for

  • live lectures (in brown)
  • live discussion sections (in orange)
  • live exam prep and other reviews (in green)
diff --git a/_site/index.html b/_site/index.html index e27586f..e994429 100644 --- a/_site/index.html +++ b/_site/index.html @@ -1 +1 @@ - Home / Schedule | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Data 100: Principles and Techniques of Data Science

UC Berkeley, Summer 2023

Ed Datahub Gradescope Extenuating Circumstances

Bella Crouch

Bella Crouch

She/Her/Hers

isabella.crouch@berkeley.edu

Office Hours: Tue, Th 3-4pm (Warren 111)

Dominic Liu

Dominic Liu

He/Him/His

hangxingliu@berkeley.edu

Office Hours: Mon, Wed 3-4pm (Warren 111)

Welcome to Week 8!

Schedule

Week 1

Jun 20
Lecture 1 Course Overview
Note 1
Lab 1 Prerequisite Coding (due Jun 24)
Homework 1A Plotting and the Permutation Test (due Jun 26)
Homework 1B Prerequisite Math (due Jun 26)
Jun 21
Lecture 2 Pandas I
Note 2
Discussion 1 Math Prerequisites
Solution
Jun 22
Lecture 3 Pandas II
Note 3

Week 2

Jun 26
Lecture 4 Pandas III, EDA I
Note 4
Discussion 2 Pandas worksheet, worksheet notebook, groupwork notebook
Solution
Lab 2 Pandas (due Jul 1)
Lab 3 Data Cleaning and EDA (due Jul 1)
Homework 2 Pandas (due Jun 29)
Jun 27
Lecture 5 EDA II
Note 5
Jun 28
Lecture 6 Text Wrangling, Regex
Note 6
Discussion 3 EDA
Solution
Jun 29
Lecture 7 Visualization
Note 7
Homework 3 Tweets (due Jul 3)
Jun 30
Exam Prep 1 Pandas
Solution

Week 3

Jul 3
Break (no lecture)
Discussion 4 Regex (optional)
Solution, Video Walkthrough
Lab 4 Transformation (due Jul 8)
Lab 5 Modeling, Summary Statistics, Loss Functions (due Jul 8)
Homework 4 Bike Sharing (Visualization) (due Jul 6)
Jul 4
Independence Day (no lecture)
Jul 5
Lecture 8 Sampling
Note 8
Discussion 5 Visualization Worksheet, Notebook
Solution
Jul 6
Lecture 9 Modeling, SLR
Note 9
Homework 5A Sampling (due Jul 10)
Homework 5B Modeling (due Jul 10)
Jul 7
Exam Prep 2 Regex, KDE Plots
Solution

Week 4

Jul 10
Lecture 10 Constant model, loss, and transformations
Note 10
Discussion 6 Sampling, SLR
Solution
Lab 6 Ordinary Least Squares (due Jul 15)
Lab 7 Gradient Descent, Feature Engineering (due Jul 15)
Homework 6 Regression (due Jul 13)
Jul 11
Lecture 11 Ordinary Least Squares (Multiple Linear Regression)
Note 11
Jul 12
Lecture 12 Gradient Descent
Note 12
Discussion 7 Transformations, OLS
Solution
Jul 13
Lecture 13 Sklearn, Feature Engineering
Note 13
Project A1 Housing I (due Jul 17)

Week 5

Jul 17
Lecture 14 Case Study in Human Contexts and Ethics (CCAO)
Note 14
Discussion 8 Gradient Descent, Feature Engineering
Solution
Lab 8 Model Selection (due Jul 22)
Project A2 Housing II (due Jul 24)
Jul 18
Lecture 15 Cross-Validation, Regularization
Note 15
Jul 19
Break (no lecture)
Discussion 9 Exam Review
Jul 20
Midterm Midterm Exam (5-7 PM)

Week 6

Jul 24
Lecture 16 Random Variables
Note 16
Discussion 10 Cross-Validation, Regularization
Solution
Lab 9 Probability (due Jul 29)
Lab 10 Logistic Regression (due Jul 29)
Homework 7 Probability and Estimators (due Jul 27)
Jul 25
Lecture 17 Estimators, Bias, and Variance
Note 17
Jul 26
Lecture 18 Logistic Regression I
Note 18
Discussion 11 Random Variables, BVT
Solution
Jul 27
Lecture 19 Logistic Regression II
Note 19
Project B1 Spam & Ham I (due Jul 31)
Jul 28
Exam Prep 3 Regularization, Bias-Variance Tradeoff, Cross-Validation, Random Variables
Solution

Week 7

Jul 31
Lecture 20 SQL I
Note 20
Discussion 12 Logistic Regression
Solution
Lab 11 SQL (due Aug 5)
Lab 12 PCA (due Aug 5)
Project B2 Spam & Ham II (due Aug 3)
Aug 1
Lecture 21 SQL II
Note 21
Aug 2
Lecture 22 PCA I
Note 22
Discussion 13 SQL
Solution
Aug 3
Lecture 23 PCA II
Note 23
Homework 8 SQL, PCA (due Aug 7)

Week 8

Aug 7
Lecture 24 Decision Trees
Note 24
Discussion 14 PCA
Solution
Lab 13 Decision Trees (optional)
Aug 8
Lecture 25 Conclusion
Aug 9
Break (no lecture)
Discussion 15 Decision Trees, Final Review
Aug 10
Final Final Exam (5-7 PM)
+ Home / Schedule | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Data 100: Principles and Techniques of Data Science

UC Berkeley, Fall 2023

Ed Datahub Gradescope Extenuating Circumstances

Fernando Pérez

Fernando Pérez

He/Him/His

fernando.perez@berkeley.edu

Narges Norouzi

Narges Norouzi

She/Her/Hers

norouzi@berkeley.edu

Announcements:

Schedule

Week 1

Jun 20
Lecture 1 Course Overview
Note 1
Lab 1 Prerequisite Coding (due Jun 24)
Homework 1A Plotting and the Permutation Test (due Jun 26)
Homework 1B Prerequisite Math (due Jun 26)
Jun 21
Lecture 2 Pandas I
Note 2
Discussion 1 Math Prerequisites
Solution
Jun 22
Lecture 3 Pandas II
Note 3

Week 2

Jun 26
Lecture 4 Pandas III, EDA I
Note 4
Discussion 2 Pandas worksheet, worksheet notebook, groupwork notebook
Solution
Lab 2 Pandas (due Jul 1)
Lab 3 Data Cleaning and EDA (due Jul 1)
Homework 2 Pandas (due Jun 29)
Jun 27
Lecture 5 EDA II
Note 5
Jun 28
Lecture 6 Text Wrangling, Regex
Note 6
Discussion 3 EDA
Solution
Jun 29
Lecture 7 Visualization
Note 7
Homework 3 Tweets (due Jul 3)
Jun 30
Exam Prep 1 Pandas
Solution

Week 3

Jul 3
Break (no lecture)
Discussion 4 Regex (optional)
Solution, Video Walkthrough
Lab 4 Transformation (due Jul 8)
Lab 5 Modeling, Summary Statistics, Loss Functions (due Jul 8)
Homework 4 Bike Sharing (Visualization) (due Jul 6)
Jul 4
Independence Day (no lecture)
Jul 5
Lecture 8 Sampling
Note 8
Discussion 5 Visualization Worksheet, Notebook
Solution
Jul 6
Lecture 9 Modeling, SLR
Note 9
Homework 5A Sampling (due Jul 10)
Homework 5B Modeling (due Jul 10)
Jul 7
Exam Prep 2 Regex, KDE Plots
Solution

Week 4

Jul 10
Lecture 10 Constant model, loss, and transformations
Note 10
Discussion 6 Sampling, SLR
Solution
Lab 6 Ordinary Least Squares (due Jul 15)
Lab 7 Gradient Descent, Feature Engineering (due Jul 15)
Homework 6 Regression (due Jul 13)
Jul 11
Lecture 11 Ordinary Least Squares (Multiple Linear Regression)
Note 11
Jul 12
Lecture 12 Gradient Descent
Note 12
Discussion 7 Transformations, OLS
Solution
Jul 13
Lecture 13 Sklearn, Feature Engineering
Note 13
Project A1 Housing I (due Jul 17)

Week 5

Jul 17
Lecture 14 Case Study in Human Contexts and Ethics (CCAO)
Note 14
Discussion 8 Gradient Descent, Feature Engineering
Solution
Lab 8 Model Selection (due Jul 22)
Project A2 Housing II (due Jul 24)
Jul 18
Lecture 15 Cross-Validation, Regularization
Note 15
Jul 19
Break (no lecture)
Discussion 9 Exam Review
Jul 20
Midterm Midterm Exam (5-7 PM)

Week 6

Jul 24
Lecture 16 Random Variables
Note 16
Discussion 10 Cross-Validation, Regularization
Solution
Lab 9 Probability (due Jul 29)
Lab 10 Logistic Regression (due Jul 29)
Homework 7 Probability and Estimators (due Jul 27)
Jul 25
Lecture 17 Estimators, Bias, and Variance
Note 17
Jul 26
Lecture 18 Logistic Regression I
Note 18
Discussion 11 Random Variables, BVT
Solution
Jul 27
Lecture 19 Logistic Regression II
Note 19
Project B1 Spam & Ham I (due Jul 31)
Jul 28
Exam Prep 3 Regularization, Bias-Variance Tradeoff, Cross-Validation, Random Variables
Solution

Week 7

Jul 31
Lecture 20 SQL I
Note 20
Discussion 12 Logistic Regression
Solution
Lab 11 SQL (due Aug 5)
Lab 12 PCA (due Aug 5)
Project B2 Spam & Ham II (due Aug 3)
Aug 1
Lecture 21 SQL II
Note 21
Aug 2
Lecture 22 PCA I
Note 22
Discussion 13 SQL
Solution
Aug 3
Lecture 23 PCA II
Note 23
Homework 8 SQL, PCA (due Aug 7)

Week 8

Aug 7
Lecture 24 Decision Trees
Note 24
Discussion 14 PCA
Solution
Lab 13 Decision Trees (optional)
Aug 8
Lecture 25 Conclusion
Aug 9
Break (no lecture)
Discussion 15 Decision Trees, Final Review
Aug 10
Final Final Exam (5-7 PM)
diff --git a/_site/lecture/lec01/index.html b/_site/lecture/lec01/index.html index e6427fa..9b87724 100644 --- a/_site/lecture/lec01/index.html +++ b/_site/lecture/lec01/index.html @@ -1 +1 @@ - Lecture 1 – Course Overview | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 1 – Introduction

Presented by Bella Crouch and Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 1 – Course Overview | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 1 – Introduction

Presented by Bella Crouch and Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec02/index.html b/_site/lecture/lec02/index.html index 64a0090..ee6926b 100644 --- a/_site/lecture/lec02/index.html +++ b/_site/lecture/lec02/index.html @@ -1 +1 @@ - Lecture 2 – Pandas, Part I | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 2 – Pandas, Part I

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 2 – Pandas, Part I | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 2 – Pandas, Part I

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec03/index.html b/_site/lecture/lec03/index.html index dfa5ce7..912ef33 100644 --- a/_site/lecture/lec03/index.html +++ b/_site/lecture/lec03/index.html @@ -1 +1 @@ - Lecture 3 – Pandas, Part II | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 3 – Pandas, Part II

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 3 – Pandas, Part II | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 3 – Pandas, Part II

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec04/index.html b/_site/lecture/lec04/index.html index f6221f0..ea8dada 100644 --- a/_site/lecture/lec04/index.html +++ b/_site/lecture/lec04/index.html @@ -1 +1 @@ - Lecture 4 – Pandas, Part III and EDA, Part I | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 4 – Pandas, Part III and EDA, Part I

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 4 – Pandas, Part III and EDA, Part I | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 4 – Pandas, Part III and EDA, Part I

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec05/index.html b/_site/lecture/lec05/index.html index 20b7918..1cc2997 100644 --- a/_site/lecture/lec05/index.html +++ b/_site/lecture/lec05/index.html @@ -1 +1 @@ - Lecture 5 – EDA II | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 5 – EDA II

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 5 – EDA II | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 5 – EDA II

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec06/index.html b/_site/lecture/lec06/index.html index 6322618..68dd1d6 100644 --- a/_site/lecture/lec06/index.html +++ b/_site/lecture/lec06/index.html @@ -1 +1 @@ - Lecture 6 – Text Wrangling and Regex | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 6 – Text Wrangling and Regex

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

  • slides
  • code
  • code HTML
  • recording
    • The screen is blank for the first 15 minutes of the recording, please follow along with the slides. Sorry for any inconvenience.
    • You can also watch the last 12 minutes of the Data 100 (Spring 2023) Lecture 5 recording.
+ Lecture 6 – Text Wrangling and Regex | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 6 – Text Wrangling and Regex

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

  • slides
  • code
  • code HTML
  • recording
    • The screen is blank for the first 15 minutes of the recording, please follow along with the slides. Sorry for any inconvenience.
    • You can also watch the last 12 minutes of the Data 100 (Spring 2023) Lecture 5 recording.
diff --git a/_site/lecture/lec07/index.html b/_site/lecture/lec07/index.html index 68ef8c8..e74ecc5 100644 --- a/_site/lecture/lec07/index.html +++ b/_site/lecture/lec07/index.html @@ -1 +1 @@ - Lecture 7 – Visualization | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 7 – Visualization

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 7 – Visualization | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 7 – Visualization

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec08/index.html b/_site/lecture/lec08/index.html index c101df9..af01172 100644 --- a/_site/lecture/lec08/index.html +++ b/_site/lecture/lec08/index.html @@ -1 +1 @@ - Lecture 8 – Sampling | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 8 – Sampling

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 8 – Sampling | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 8 – Sampling

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec09/index.html b/_site/lecture/lec09/index.html index 2e7e401..a91d16b 100644 --- a/_site/lecture/lec09/index.html +++ b/_site/lecture/lec09/index.html @@ -1 +1 @@ - Lecture 9 – Modeling, SLR | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 9 – Modeling, SLR

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 9 – Modeling, SLR | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 9 – Modeling, SLR

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec10/index.html b/_site/lecture/lec10/index.html index 1e0365e..8dddd14 100644 --- a/_site/lecture/lec10/index.html +++ b/_site/lecture/lec10/index.html @@ -1 +1 @@ - Lecture 10 – Constant model, loss, and transformations | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 10 – Constant model, loss, and transformations

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 10 – Constant model, loss, and transformations | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 10 – Constant model, loss, and transformations

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec11/index.html b/_site/lecture/lec11/index.html index e6cac1c..67877b6 100644 --- a/_site/lecture/lec11/index.html +++ b/_site/lecture/lec11/index.html @@ -1 +1 @@ - Lecture 11 – Ordinary Least Squares | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 11 – Ordinary Least Squares

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 11 – Ordinary Least Squares | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 11 – Ordinary Least Squares

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec12/index.html b/_site/lecture/lec12/index.html index 7a9d254..ed37d15 100644 --- a/_site/lecture/lec12/index.html +++ b/_site/lecture/lec12/index.html @@ -1 +1 @@ - Lecture 12 – Gradient Descent | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 12 – Gradient Descent

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 12 – Gradient Descent | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 12 – Gradient Descent

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec13/index.html b/_site/lecture/lec13/index.html index 4905b0c..a2a0b0c 100644 --- a/_site/lecture/lec13/index.html +++ b/_site/lecture/lec13/index.html @@ -1 +1 @@ - Lecture 13 – Sklearn, Feature Engineering | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 13 – Sklearn, Feature Engineering

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 13 – Sklearn, Feature Engineering | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 13 – Sklearn, Feature Engineering

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec14/index.html b/_site/lecture/lec14/index.html index 3cb4f01..3a5f08b 100644 --- a/_site/lecture/lec14/index.html +++ b/_site/lecture/lec14/index.html @@ -1 +1 @@ - Lecture 14 – Case Study in Human Contexts and Ethics (CCAO) | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 14 – Case Study in Human Contexts and Ethics (CCAO)

Presented by Ari Edmundson

+ Lecture 14 – Case Study in Human Contexts and Ethics (CCAO) | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 14 – Case Study in Human Contexts and Ethics (CCAO)

Presented by Ari Edmundson

diff --git a/_site/lecture/lec15/index.html b/_site/lecture/lec15/index.html index 081202d..1256136 100644 --- a/_site/lecture/lec15/index.html +++ b/_site/lecture/lec15/index.html @@ -1 +1 @@ - Lecture 15 – Cross-Validation, Regularization | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 15 – Cross-Validation, Regularization

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 15 – Cross-Validation, Regularization | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 15 – Cross-Validation, Regularization

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec16/index.html b/_site/lecture/lec16/index.html index 1234a60..e03b24d 100644 --- a/_site/lecture/lec16/index.html +++ b/_site/lecture/lec16/index.html @@ -1 +1 @@ - Lecture 16 – Random Variables | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 16 – Random Variables

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 16 – Random Variables | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 16 – Random Variables

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec17/index.html b/_site/lecture/lec17/index.html index 2a6abcc..857111e 100644 --- a/_site/lecture/lec17/index.html +++ b/_site/lecture/lec17/index.html @@ -1 +1 @@ - Lecture 17 – Model Bias, Variance, and Inference | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 17 – Model Bias, Variance, and Inference

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 17 – Model Bias, Variance, and Inference | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 17 – Model Bias, Variance, and Inference

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec18/index.html b/_site/lecture/lec18/index.html index 246045c..4ce8905 100644 --- a/_site/lecture/lec18/index.html +++ b/_site/lecture/lec18/index.html @@ -1 +1 @@ - Lecture 18 – Logistic Regression I | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 18 – Logistic Regression I

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 18 – Logistic Regression I | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 18 – Logistic Regression I

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec19/index.html b/_site/lecture/lec19/index.html index aac8614..0d23cf8 100644 --- a/_site/lecture/lec19/index.html +++ b/_site/lecture/lec19/index.html @@ -1 +1 @@ - Lecture 19 – Logistic Regression II | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 19 – Logistic Regression II

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 19 – Logistic Regression II | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 19 – Logistic Regression II

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec20/index.html b/_site/lecture/lec20/index.html index f6c6ce1..8599a23 100644 --- a/_site/lecture/lec20/index.html +++ b/_site/lecture/lec20/index.html @@ -1 +1 @@ - Lecture 20 – SQL I | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 20 – SQL I

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 20 – SQL I | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 20 – SQL I

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec21/index.html b/_site/lecture/lec21/index.html index 1e055c4..759adc1 100644 --- a/_site/lecture/lec21/index.html +++ b/_site/lecture/lec21/index.html @@ -1 +1 @@ - Lecture 21 – SQL II | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 21 – SQL II

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 21 – SQL II | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 21 – SQL II

Presented by Bella Crouch

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec22/index.html b/_site/lecture/lec22/index.html index bbef8d5..3b44da6 100644 --- a/_site/lecture/lec22/index.html +++ b/_site/lecture/lec22/index.html @@ -1 +1 @@ - Lecture 22 – PCA I | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 22 – PCA I

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 22 – PCA I | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 22 – PCA I

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec23/index.html b/_site/lecture/lec23/index.html index 3ecfcaf..dbf5748 100644 --- a/_site/lecture/lec23/index.html +++ b/_site/lecture/lec23/index.html @@ -1 +1 @@ - Lecture 23 – PCA II | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 23 – PCA II

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 23 – PCA II | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 23 – PCA II

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec24/index.html b/_site/lecture/lec24/index.html index 564a2dc..b70563c 100644 --- a/_site/lecture/lec24/index.html +++ b/_site/lecture/lec24/index.html @@ -1 +1 @@ - Lecture 24 – Decision trees | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 24 - Decision Trees

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 24 – Decision trees | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 24 - Decision Trees

Presented by Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/lecture/lec25/index.html b/_site/lecture/lec25/index.html index a22046c..9202b15 100644 --- a/_site/lecture/lec25/index.html +++ b/_site/lecture/lec25/index.html @@ -1 +1 @@ - Lecture 25 – Conclusion | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 25 - Conclusion

Presented by Bella Crouch and Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

+ Lecture 25 – Conclusion | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Lecture 25 - Conclusion

Presented by Bella Crouch and Dominic Liu

Content by many dedicated Data 100 instructors at UC Berkeley. See our Acknowledgments page.

diff --git a/_site/resources/assets/staff_pics/README/index.html b/_site/resources/assets/staff_pics/README/index.html index f271d82..0574506 100644 --- a/_site/resources/assets/staff_pics/README/index.html +++ b/_site/resources/assets/staff_pics/README/index.html @@ -1 +1 @@ - Staff Pictures | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Staff Pictures

Staff pictures go here

+ Staff Pictures | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Staff Pictures

Staff pictures go here

diff --git a/_site/resources/index.html b/_site/resources/index.html index c627f4d..6545875 100644 --- a/_site/resources/index.html +++ b/_site/resources/index.html @@ -1 +1 @@ - Resources | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Resources

Here is a collection of resources that will help you learn more about various concepts and skills covered in the class. Learning by reading is a key part of being a well rounded data scientist. We will not assign mandatory reading but instead encourage you to look at these and other materials. If you find something helpful, post it on EdStem, and consider contributing it to the course website.

Jump to:

Supplementary Course Notes

Alongside each lecture are supplementary Course Notes.

Lecture notes will be updated on a weekly basis, prior to the lecture. If you spot any errors or would like to suggest any changes, please email us at data100.instructors@berkeley.edu.

Optional Supplementary Textbook

Alongside each lecture are optional textbook readings to the Data 100 textbook, Principles and Techniques of Data Science. Textbook readings are purely supplementary, and may contain material that is not in scope (and may also not be comprehensive).

Exam Resources

Course Website

We will be posting all lecture materials on the course syllabus. In addition, they will also be listed in the following publicly visible Github Repo.

You can send us changes to the course website by forking and sending a pull request to the course website github repository. You will then become part of the history of Data 100 at Berkeley.

Coding and Mathematics Resources

Pandas

SQL

  • We’ve assembled some SQL Review Slides to help you brush up on SQL.
  • We’ve also compiled a list of SQL practice problems, which can be found here, along with their solutions.
  • This SQL Cheat Sheet is an awesome resource that was created by Luke Harrison, a former Data 100 student.

Regex

  • Regex101.com. Remember to select the Python flavour of Regex!
  • DS100 Reference Sheet
  • We’ve organized some regular expressions(regex) problems to help you get extra practice on regex in a notebook format. They can be found here, along with their solutions.
  • The official Python3 regex guide is good: link

LaTeX

Other Web References

As a data scientist you will often need to search for information on various libraries and tools. In this class we will be using several key python libraries. Here are their documentation pages:

Calculus and Linear Algebra

Note: None of these resources are meant to be a substitute for the appropriate requirement / co-requisite (Math 54, etc.). If you have no familiarity whatsoever with either of these topics, these may not be adequate and we strongly recommend spending time covering the prerequisite material yourself. We will assume that you have prior knowledge of these requirements and that these resources are simply to refresh your memory of concepts that you have previously learned. Please reach out to staff if you have any questions or concerns about this.

Calculus: In terms of calculus, you will need to know a few things, most of which are covered within the space of the first homework and lab. Specifically, you will need to know univariate calculus rules like: Taking derivatives of a univariate function (i.e. f(x), where x is the only variable); Derivative power rule; Knowing derivatives of mathematical functions like: sinx,cosx,logx,ex; Chain rule; Product rule (rarely); Derivatives of sums. We will expect some multivariate fluency like: Taking partial derivatives of a multivariate function (i.e. f(x,y,z), where x,y,z are all variables); Gradients (the concept).

Linear Algebra:

Concepts roughly in order of importance: vectors, matrices; rank/nullity; inner products, orthogonality, norms; linear independence; orthonormal matrices; vector spaces; projections; invertibility.

Probability

  • We’ve compiled a few practice probability problems that we believe may help in understanding the ideas covered in the course. They can be found here, along with their solutions.
  • We’d also like to point you to the textbook for Data C88S, an introductory probability course geared towards data science students at Berkeley.

Books

Because data science is a relatively new and rapidly evolving discipline there is no single ideal textbook for this subject. Instead we plan to use reading from a collection of books all of which are free. However, we have listed a few optional books that will provide additional context for those who are interested.

Wellness Resources

Your well-being matters, and we hope that Data 100 is never a barrier to taking care of your mental and physical health. Below are some campus resources that may be helpful.

COVID-19 Resources and Support

You can find UC Berkeley’ COVID-19 resources and support here.

For academic performance, support, and technology

The Center for Access to Engineering Excellence (Bechtel Engineering Center 227) is an inclusive center that offers study spaces, nutritious snacks, and tutoring in >50 courses for Berkeley engineers and other majors across campus. The Center also offers a wide range of professional development, leadership, and wellness programs, and loans iclickers, laptops, and professional attire for interviews.

As the primary academic support service for undergraduates at UC Berkeley, the Student Learning Center (510-642-7332) assists students in transitioning to Cal, navigating the academic terrain, creating networks of resources, and achieving academic, personal, and professional goals. Through various services including tutoring, study groups, workshops, and courses, SLC supports undergraduate students in Biological and Physical Sciences, Business Administration, Computer Science, Economics, Mathematics, Social Sciences, Statistics, Study Strategies, and Writing.

The Educational Opportunity Program (EOP, Cesar Chavez Student Center 119; 510-642-7224) at Cal has provided first generation and low income college students with the guidance and resources necessary to succeed at the best public university in the world. EOP’s individualized academic counseling, support services, and extensive campus referral network help students develop the unique gifts and talents they each bring to the university while empowering them to achieve.

Students can access device lending options through the Student Technology Equity Program (STEP) program.

For mental well-being

The staff of the UHS Counseling and Psychological Services (Tang Center, 2222 Bancroft Way; 510-642-9494; for after-hours support, please call the 24/7 line at 855-817-5667) provides confidential, brief counseling and crisis intervention to students with personal, academic and career stress. Services are provided by a multicultural group of professional counselors including psychologists, social workers, and advanced level trainees. All undergraduate and graduate students are eligible for CAPS services, regardless of insurance coverage.

To improve access for engineering students, a licensed psychologist from the Tang Center also holds walk-in appointments for confidential counseling in Bechtel Engineering Center 241 (check here for schedule).

For disability accommodations

The Disabled Students’ Program (DSP, 260 César Chávez Student Center #4250; 510-642-0518) serves students with disabilities of all kinds, including mobility impairments, blind or low vision, deaf or hard of hearing; chronic illnesses (chronic pain, repetitive strain injuries, brain injuries, AIDS/HIV, cancer, etc.) psychological disabilities (bipolar disorder, severe anxiety or depression, etc.), Attention Deficit Disorder/Attention Deficit Hyperactivity Disorder, and Learning Disabilities. Services are individually designed and based on the specific needs of each student as identified by DSP’s Specialists. The Program’s official website includes information on DSP staff, UCB’s disabilities policy, application procedures, campus access guides for most university buildings, and portals for students and faculty.

For solving a dispute

The Ombudsperson for Students (Sproul Hall 102; 510-642-5754) provides a confidential service for students involved in a University-related problem (academic or administrative), acting as a neutral complaint resolver and not as an advocate for any of the parties involved in a dispute. The Ombudsperson can provide information on policies and procedures affecting students, facilitate students’ contact with services able to assist in resolving the problem, and assist students in complaints concerning improper application of University policies or procedures. All matters referred to this office are held in strict confidence. The only exceptions, at the sole discretion of the Ombudsperson, are cases where there appears to be imminent threat of serious harm.

The Student Advocate’s Office (SAO) is an executive, non-partisan office of the ASUC. We offer free, confidential casework services and resources to any student(s) navigating issues with the University, including academic, conduct, financial aid, and grievance concerns. All support is centered around students and aims for an equity-based approach.

For recovery from sexual harassment or sexual assault

The Care Line (510-643-2005) is a 24/7, confidential, free, campus-based resource for urgent support around sexual assault, sexual harassment, interpersonal violence, stalking, and invasion of sexual privacy. The Care Line will connect you with a confidential advocate for trauma-informed crisis support including time-sensitive information, securing urgent safety resources, and accompaniment to medical care or reporting.

For social services

Social Services provides confidential services and counseling to help students with managing problems that can emerge from illness such as financial, academic, legal, family concerns, and more. They specialize in helping students with pregnancy resources and referrals; alcohol/drug problems related to one’s own or a family member’s use; sexual assault/rape; relationship or other violence; and support for health concerns-new diagnoses or ongoing conditions. Social Services staff will assess a student’s immediate needs, work with the student to develop a plan to meet those needs, and facilitate arrangements with academic departments and advocate for the student with other campus offices and community agencies, as well as coordinate services within UHS.

For finding community on campus

The mission of the Berkeley International Office (2299 Piedmont Avenue, 510-642-2818) is to provide support with all the essential resources needed to not only survive, but thrive here at UC Berkeley. Their mission is to support you and work together towards justice and belonging for all. They define Basic Needs as the essential resources that impact your health, belonging, persistence, and overall well being. It is an ecosystem that includes: nutritious food, stable housing, hygiene, transportation, healthcare, mental wellness, financial sustainability, sleep, and emergency dependent services. They refuse to accept hunger, homelessness, and all other basic needs injustices as part of our university.

The Gender Equity Resource Center, fondly referred to as GenEq, is a UC Berkeley campus community center committed to fostering an inclusive Cal experience for all. GenEq is the campus location where students, faculty, staff and Alumni connect for resources, services, education and leadership programs related to gender and sexuality. The programs and services of the Gender Equity Resource Center are focused into four key areas: women; lesbian, gay, bisexual, and transgender (LGBT); sexual and dating violence; and hate crimes and bias driven incidents. GenEq strives to provide a space for respectful dialogue about sexuality and gender; illuminate the interrelationship of sexism, homophobia and gender bias and violence; create a campus free of violence and hate; provide leadership opportunities; advocate on behalf of survivors of sexual, hate, dating and gender violence; foster a community of women and LGBT leaders; and be a portal to campus and community resources on LGBT, Women, and the many intersections of identity (e.g., race, class, ability, etc.).

The Undocumented Students Program (119 Cesar Chavez Center; 642-7224) practices a holistic, multicultural and solution-focused approach that delivers individualized service for each student. The academic counseling, legal support, financial aid resources and extensive campus referral network provided by USP helps students develop the unique gifts and talents they each bring to the university, while empowering a sense of belonging. The program’s mission is to support the advancement of undocumented students within higher education and promote pathways for engaged scholarship.

The Multicultural Education Program (MEP) is one of six initiatives funded by the Evelyn and Walter Haas, Jr. Fund to work towards institutional change and to create a positive campus climate for diversity. The MEP is a five-year initiative to establish a sustainable infrastructure for activities like educational consultation and diversity workshops for the campus that address both specific topics, and to cater to group needs across the campus.

For basic needs (food, shelter, etc.)

The Basic Needs Center (lower level of MLK Student Union, Suite 72) provides support with all the essential resources needed to not only survive, but thrive here at UC Berkeley. Their mission is to support you and work together towards justice and belonging for all. They define Basic Needs as the essential resources that impact your health, belonging, persistence, and overall well being. It is an ecosystem that includes: nutritious food, stable housing, hygiene, transportation, healthcare, mental wellness, financial sustainability, sleep, and emergency dependent services. They refuse to accept hunger, homelessness, and all other basic needs injustices as part of our university.

The UC Berkeley Food Pantry (#68 Martin Luther King Student Union) aims to reduce food insecurity among students and staff at UC Berkeley, especially the lack of nutritious food. Students and staff can visit the pantry as many times as they need and take as much as they need while being mindful that it is a shared resource. The pantry operates on a self-assessed need basis; there are no eligibility requirements. The pantry is not for students and staff who need supplemental snacking food, but rather, core food support.

Data Science Education

Interested in bringing the Data Science major or curriculum to your academic institution? Please fill out this form if you would like support from Berkeley in offering some variant of our Data Science courses at your institution (or just to let us know that you’re interested). Information about the courses appear at data8.org and ds100.org. Please note that this form is only for instructors. If you are only interested in learning Python or data science, please look at our Data 8 or Data 100 websites mentioned above.

Local Setup (Old)

NOTE: This section is out of date and no longer supported by the course staff.

Click here to read our guide on how to set up our development environment locally (as an alternative to using DataHub). Please note that any autograder tests will only work on DataHub.

+ Resources | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Resources

Here is a collection of resources that will help you learn more about various concepts and skills covered in the class. Learning by reading is a key part of being a well rounded data scientist. We will not assign mandatory reading but instead encourage you to look at these and other materials. If you find something helpful, post it on EdStem, and consider contributing it to the course website.

Jump to:

Supplementary Course Notes

Alongside each lecture are supplementary Course Notes.

Lecture notes will be updated on a weekly basis, prior to the lecture. If you spot any errors or would like to suggest any changes, please email us at data100.instructors@berkeley.edu.

Optional Supplementary Textbook

Alongside each lecture are optional textbook readings to the Data 100 textbook, Principles and Techniques of Data Science. Textbook readings are purely supplementary, and may contain material that is not in scope (and may also not be comprehensive).

Exam Resources

Course Website

We will be posting all lecture materials on the course syllabus. In addition, they will also be listed in the following publicly visible Github Repo.

You can send us changes to the course website by forking and sending a pull request to the course website github repository. You will then become part of the history of Data 100 at Berkeley.

Coding and Mathematics Resources

Pandas

SQL

  • We’ve assembled some SQL Review Slides to help you brush up on SQL.
  • We’ve also compiled a list of SQL practice problems, which can be found here, along with their solutions.
  • This SQL Cheat Sheet is an awesome resource that was created by Luke Harrison, a former Data 100 student.

Regex

  • Regex101.com. Remember to select the Python flavour of Regex!
  • DS100 Reference Sheet
  • We’ve organized some regular expressions(regex) problems to help you get extra practice on regex in a notebook format. They can be found here, along with their solutions.
  • The official Python3 regex guide is good: link

LaTeX

Other Web References

As a data scientist you will often need to search for information on various libraries and tools. In this class we will be using several key python libraries. Here are their documentation pages:

Calculus and Linear Algebra

Note: None of these resources are meant to be a substitute for the appropriate requirement / co-requisite (Math 54, etc.). If you have no familiarity whatsoever with either of these topics, these may not be adequate and we strongly recommend spending time covering the prerequisite material yourself. We will assume that you have prior knowledge of these requirements and that these resources are simply to refresh your memory of concepts that you have previously learned. Please reach out to staff if you have any questions or concerns about this.

Calculus: In terms of calculus, you will need to know a few things, most of which are covered within the space of the first homework and lab. Specifically, you will need to know univariate calculus rules like: Taking derivatives of a univariate function (i.e. f(x), where x is the only variable); Derivative power rule; Knowing derivatives of mathematical functions like: sinx,cosx,logx,ex; Chain rule; Product rule (rarely); Derivatives of sums. We will expect some multivariate fluency like: Taking partial derivatives of a multivariate function (i.e. f(x,y,z), where x,y,z are all variables); Gradients (the concept).

Linear Algebra:

Concepts roughly in order of importance: vectors, matrices; rank/nullity; inner products, orthogonality, norms; linear independence; orthonormal matrices; vector spaces; projections; invertibility.

Probability

  • We’ve compiled a few practice probability problems that we believe may help in understanding the ideas covered in the course. They can be found here, along with their solutions.
  • We’d also like to point you to the textbook for Data C88S, an introductory probability course geared towards data science students at Berkeley.

Books

Because data science is a relatively new and rapidly evolving discipline there is no single ideal textbook for this subject. Instead we plan to use reading from a collection of books all of which are free. However, we have listed a few optional books that will provide additional context for those who are interested.

Wellness Resources

Your well-being matters, and we hope that Data 100 is never a barrier to taking care of your mental and physical health. Below are some campus resources that may be helpful.

COVID-19 Resources and Support

You can find UC Berkeley’ COVID-19 resources and support here.

For academic performance, support, and technology

The Center for Access to Engineering Excellence (Bechtel Engineering Center 227) is an inclusive center that offers study spaces, nutritious snacks, and tutoring in >50 courses for Berkeley engineers and other majors across campus. The Center also offers a wide range of professional development, leadership, and wellness programs, and loans iclickers, laptops, and professional attire for interviews.

As the primary academic support service for undergraduates at UC Berkeley, the Student Learning Center (510-642-7332) assists students in transitioning to Cal, navigating the academic terrain, creating networks of resources, and achieving academic, personal, and professional goals. Through various services including tutoring, study groups, workshops, and courses, SLC supports undergraduate students in Biological and Physical Sciences, Business Administration, Computer Science, Economics, Mathematics, Social Sciences, Statistics, Study Strategies, and Writing.

The Educational Opportunity Program (EOP, Cesar Chavez Student Center 119; 510-642-7224) at Cal has provided first generation and low income college students with the guidance and resources necessary to succeed at the best public university in the world. EOP’s individualized academic counseling, support services, and extensive campus referral network help students develop the unique gifts and talents they each bring to the university while empowering them to achieve.

Students can access device lending options through the Student Technology Equity Program (STEP) program.

For mental well-being

The staff of the UHS Counseling and Psychological Services (Tang Center, 2222 Bancroft Way; 510-642-9494; for after-hours support, please call the 24/7 line at 855-817-5667) provides confidential, brief counseling and crisis intervention to students with personal, academic and career stress. Services are provided by a multicultural group of professional counselors including psychologists, social workers, and advanced level trainees. All undergraduate and graduate students are eligible for CAPS services, regardless of insurance coverage.

To improve access for engineering students, a licensed psychologist from the Tang Center also holds walk-in appointments for confidential counseling in Bechtel Engineering Center 241 (check here for schedule).

For disability accommodations

The Disabled Students’ Program (DSP, 260 César Chávez Student Center #4250; 510-642-0518) serves students with disabilities of all kinds, including mobility impairments, blind or low vision, deaf or hard of hearing; chronic illnesses (chronic pain, repetitive strain injuries, brain injuries, AIDS/HIV, cancer, etc.) psychological disabilities (bipolar disorder, severe anxiety or depression, etc.), Attention Deficit Disorder/Attention Deficit Hyperactivity Disorder, and Learning Disabilities. Services are individually designed and based on the specific needs of each student as identified by DSP’s Specialists. The Program’s official website includes information on DSP staff, UCB’s disabilities policy, application procedures, campus access guides for most university buildings, and portals for students and faculty.

For solving a dispute

The Ombudsperson for Students (Sproul Hall 102; 510-642-5754) provides a confidential service for students involved in a University-related problem (academic or administrative), acting as a neutral complaint resolver and not as an advocate for any of the parties involved in a dispute. The Ombudsperson can provide information on policies and procedures affecting students, facilitate students’ contact with services able to assist in resolving the problem, and assist students in complaints concerning improper application of University policies or procedures. All matters referred to this office are held in strict confidence. The only exceptions, at the sole discretion of the Ombudsperson, are cases where there appears to be imminent threat of serious harm.

The Student Advocate’s Office (SAO) is an executive, non-partisan office of the ASUC. We offer free, confidential casework services and resources to any student(s) navigating issues with the University, including academic, conduct, financial aid, and grievance concerns. All support is centered around students and aims for an equity-based approach.

For recovery from sexual harassment or sexual assault

The Care Line (510-643-2005) is a 24/7, confidential, free, campus-based resource for urgent support around sexual assault, sexual harassment, interpersonal violence, stalking, and invasion of sexual privacy. The Care Line will connect you with a confidential advocate for trauma-informed crisis support including time-sensitive information, securing urgent safety resources, and accompaniment to medical care or reporting.

For social services

Social Services provides confidential services and counseling to help students with managing problems that can emerge from illness such as financial, academic, legal, family concerns, and more. They specialize in helping students with pregnancy resources and referrals; alcohol/drug problems related to one’s own or a family member’s use; sexual assault/rape; relationship or other violence; and support for health concerns-new diagnoses or ongoing conditions. Social Services staff will assess a student’s immediate needs, work with the student to develop a plan to meet those needs, and facilitate arrangements with academic departments and advocate for the student with other campus offices and community agencies, as well as coordinate services within UHS.

For finding community on campus

The mission of the Berkeley International Office (2299 Piedmont Avenue, 510-642-2818) is to provide support with all the essential resources needed to not only survive, but thrive here at UC Berkeley. Their mission is to support you and work together towards justice and belonging for all. They define Basic Needs as the essential resources that impact your health, belonging, persistence, and overall well being. It is an ecosystem that includes: nutritious food, stable housing, hygiene, transportation, healthcare, mental wellness, financial sustainability, sleep, and emergency dependent services. They refuse to accept hunger, homelessness, and all other basic needs injustices as part of our university.

The Gender Equity Resource Center, fondly referred to as GenEq, is a UC Berkeley campus community center committed to fostering an inclusive Cal experience for all. GenEq is the campus location where students, faculty, staff and Alumni connect for resources, services, education and leadership programs related to gender and sexuality. The programs and services of the Gender Equity Resource Center are focused into four key areas: women; lesbian, gay, bisexual, and transgender (LGBT); sexual and dating violence; and hate crimes and bias driven incidents. GenEq strives to provide a space for respectful dialogue about sexuality and gender; illuminate the interrelationship of sexism, homophobia and gender bias and violence; create a campus free of violence and hate; provide leadership opportunities; advocate on behalf of survivors of sexual, hate, dating and gender violence; foster a community of women and LGBT leaders; and be a portal to campus and community resources on LGBT, Women, and the many intersections of identity (e.g., race, class, ability, etc.).

The Undocumented Students Program (119 Cesar Chavez Center; 642-7224) practices a holistic, multicultural and solution-focused approach that delivers individualized service for each student. The academic counseling, legal support, financial aid resources and extensive campus referral network provided by USP helps students develop the unique gifts and talents they each bring to the university, while empowering a sense of belonging. The program’s mission is to support the advancement of undocumented students within higher education and promote pathways for engaged scholarship.

The Multicultural Education Program (MEP) is one of six initiatives funded by the Evelyn and Walter Haas, Jr. Fund to work towards institutional change and to create a positive campus climate for diversity. The MEP is a five-year initiative to establish a sustainable infrastructure for activities like educational consultation and diversity workshops for the campus that address both specific topics, and to cater to group needs across the campus.

For basic needs (food, shelter, etc.)

The Basic Needs Center (lower level of MLK Student Union, Suite 72) provides support with all the essential resources needed to not only survive, but thrive here at UC Berkeley. Their mission is to support you and work together towards justice and belonging for all. They define Basic Needs as the essential resources that impact your health, belonging, persistence, and overall well being. It is an ecosystem that includes: nutritious food, stable housing, hygiene, transportation, healthcare, mental wellness, financial sustainability, sleep, and emergency dependent services. They refuse to accept hunger, homelessness, and all other basic needs injustices as part of our university.

The UC Berkeley Food Pantry (#68 Martin Luther King Student Union) aims to reduce food insecurity among students and staff at UC Berkeley, especially the lack of nutritious food. Students and staff can visit the pantry as many times as they need and take as much as they need while being mindful that it is a shared resource. The pantry operates on a self-assessed need basis; there are no eligibility requirements. The pantry is not for students and staff who need supplemental snacking food, but rather, core food support.

Data Science Education

Interested in bringing the Data Science major or curriculum to your academic institution? Please fill out this form if you would like support from Berkeley in offering some variant of our Data Science courses at your institution (or just to let us know that you’re interested). Information about the courses appear at data8.org and ds100.org. Please note that this form is only for instructors. If you are only interested in learning Python or data science, please look at our Data 8 or Data 100 websites mentioned above.

Local Setup (Old)

NOTE: This section is out of date and no longer supported by the course staff.

Click here to read our guide on how to set up our development environment locally (as an alternative to using DataHub). Please note that any autograder tests will only work on DataHub.

diff --git a/_site/setup/index.html b/_site/setup/index.html index eb70c96..2488970 100644 --- a/_site/setup/index.html +++ b/_site/setup/index.html @@ -1,4 +1,4 @@ - Local Setup | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

Local Setup

We will still be using datahub as our primary computing environment. This page serves as a guide for alternative environment setup.

In other words: you don’t have to follow these instructions unless you’d like an alternative to datahub.

Contents

OSX

  1. You will need access to the command line. On a Mac, you can open the Terminal by opening Spotlight (Cmd + Space) and typing "Terminal". Alternatively, you can go to your Applications screen and select Terminal (it might be in the folder named "Other")

  2. Homebrew is a package manager for OSX. If you haven’t already, install it by running the following in the command line (copy, paste, and enter):

     # This downloads the Ruby code of the installation script and runs it
    +           Local Setup | Data 100                 Skip to main content   Link      Menu      Expand       (external link)    Document      Search       Copy       Copied        

    Local Setup

    We will still be using datahub as our primary computing environment. This page serves as a guide for alternative environment setup.

    In other words: you don’t have to follow these instructions unless you’d like an alternative to datahub.

    Contents

    OSX

    1. You will need access to the command line. On a Mac, you can open the Terminal by opening Spotlight (Cmd + Space) and typing "Terminal". Alternatively, you can go to your Applications screen and select Terminal (it might be in the folder named "Other")

    2. Homebrew is a package manager for OSX. If you haven’t already, install it by running the following in the command line (copy, paste, and enter):

       # This downloads the Ruby code of the installation script and runs it
        /usr/bin/ruby -e "$(curl -fsSL https://raw.githubusercontent.com/Homebrew/install/master/install)"
       

      Verify your installation by making sure brew --version doesn’t error at your terminal.

    3. Download and install Anaconda:

      # Uses curl to download the installation script
       curl https://repo.continuum.io/miniconda/Miniconda2-4.5.11-MacOSX-x86_64.sh > miniconda.sh
      diff --git a/_site/staff/index.html b/_site/staff/index.html
      index 34600da..80c09e1 100644
      --- a/_site/staff/index.html
      +++ b/_site/staff/index.html
      @@ -1 +1 @@
      -           Staff | Data 100                 Skip to main content   Link      Menu      Expand       (external link)    Document      Search       Copy       Copied        

      Staff

      Jump to: Instructors, Teaching Assistants, Readers.

      Note: Consult the calendar for the most up-to-date office hours for each GSI. All GSI Office Hours will be held in Warren 101B.

      Course Staff Email

      Contact course staff via Ed with any questions or concerns. For sensitive matters, the staff email address data100.instructors@berkeley.edu is monitored by the instructors and a few lead TAs.

      Instructors

      Bella Crouch

      Bella Crouch

      She/Her/Hers

      isabella.crouch@berkeley.edu

      Office Hours: Tue, Th 3-4pm (Warren 111)

      Dominic Liu

      Dominic Liu

      He/Him/His

      hangxingliu@berkeley.edu

      Office Hours: Mon, Wed 3-4pm (Warren 111)

      Teaching Assistants

      Alan Jian

      Alan Jian

      He/Him/His

      alanjian131@berkeley.edu

      Office Hours: Mon, Wed 1-3

      Hi there, my name is Alan and I’m a 5th year MIDS student with a background in natural language processing and an interest in data engineering and data ethics. When I’m not doing data things, you’ll either find me playing tennis at the Hearst courts or curled up at home with a good book :)

      Bennett Somerville

      Bennett Somerville

      He/Him/His

      bdsomer@berkeley.edu

      Office Hours: Mon, Tue 1-3

      I’m a rising third-year undergraduate student majoring in computer science. I enjoy writing code, teaching, cycling, repairing bikes, playing music, and learning languages, among other things. Feel free to reach out!

      Celine Choi

      Celine Choi

      She/Her/Hers

      celinejwchoi@berkeley.edu

      Office Hours: Mon, Wed 1-3

      Hey everyone! I am a rising junior studying CS. This is my second year on course staff and I’m super stoked to meet you all :)

      Mihran Miroyan

      Mihran Miroyan

      He/Him/His

      miroyan.mihran@berkeley.edu

      Office Hours: Mon, Thu 3-5

      Hey, I am Mir!

      Milad Shafaie

      Milad Shafaie

      He/Him/His

      mshafaie@berkeley.edu

      Office Hours: Tue 4-5, Wed 3-5, Thu 1-2

      Hello

      Nathan Harounian

      Nathan Harounian

      He/Him/His

      nathanharounian@berkeley.edu

      Office Hours: Fri 12-4

      Hey! I’m a senior studying Statistics and Data Science. In my free time, I enjoy hanging out with my friends, listening to music, archery, and poker! I really enjoyed taking Data 100 last summer and look forward to helping y’all this summer :)

      Stephanie Xu

      Stephanie Xu

      She/Her/Hers

      stephanie.xu@berkeley.edu

      Office Hours: Mon 11-1, Tue 12-1, Wed 12-1

      Hi! I’m a CS and Data Science double major and I’m super excited to be one of your uGSIs! Feel free to reach out to me if you have any questions regarding the course or simply want someone to talk to!

      Tina Chen

      Tina Chen

      She/Her/Hers

      czz129@berkeley.edu

      Office Hours: Thu, Fri 1-3

      Hi Everyone! I’am Tina a rising senior majoring DS + stats. I’m super exicting to meet with everyone. Feel free to reach out to me for any questions! :)))

      Yash Dave

      Yash Dave

      He/Him/His

      yashdave003@berkeley.edu

      Office Hours: Mon 12-1, Tue 12-2, Wed 12-1

      Hi! I’m Yash, a rising junior majoring in Applied Math and CS with a minor in Public Policy. Excited to be teaching Data 100 over the summer!!

      Yuerou Tang

      Yuerou Tang

      They/Them/Theirs

      yuerou.tang@berkeley.edu

      Hi! I’m a senior studying CS and Conservation & Resource Studies. Check out my website for cool bird pictures I took!!

      Zaid Maayah

      Zaid Maayah

      He/Him/His

      zaidmaayah@berkeley.edu

      Office Hours: Tue, Thu 2-4

      Hi everyone! I’m a rising fourth-year international student from Jordan, double majoring in Data science and Linguistics. I like traveling, compiling playlists, and rating every restaurant in Berkeley. I hope you enjoy the course!

      Readers

      Aneesh Durai

      Aneesh Durai

      He/Him/His

      aneesh.durai@berkeley.edu

      Hi! I’m Aneesh, and I’m very excited to be working with you this summer!

      Anthony Zhang

      Anthony Zhang

      He/Him/His

      anthony_zhang1234@berkeley.edu

      yooo it’s anthony - im an expert in bonking on my bike, entering food coma, and tripping myself in dance dance revolution. i like to study quik mafs and cs

      Archer Parry

      Archer Parry

      He/Him/His

      archerp@berkeley.edu

      Hi, I am a rising senior that enjoys hanging out with friends and playing games in my free time.

      Asbah Wasim

      Asbah Wasim

      She/Her/Hers

      asbahwasim@berkeley.edu

      Hi there, welcome to Data 100! I am a rising junior studying Cognitive Science and Data Science. In my free time, I enjoy drawing nature, painting scenery, organizing, and going on walks. I look forward to meeting you over the summer, and hope you have a great time in the class!

      Hans Mao

      Hans Mao

      He/Him/His

      huanzhimao@berkeley.edu

      Hello! I’m a rising junior majoring in CS and Stat. I’m interested in computer security, distributed systems, and machine learning. I <3 Data 100! Besides teaching, I enjoy sailing, hiking, and swimming. Looking forward to an awesome semester :o (Generated by ChatGPT)

      Matthew Lee

      Matthew Lee

      He/Him/His

      matthewlee3@berkeley.edu

      hey i’m matthew and i like great vibes. please hit me up if you have a life changing restaurant.

      Yehchan Yoo

      Yehchan Yoo

      He/Him/His

      yehchanyoo@berkeley.edu

      Hello — I am a senior majoring in Statistics and Political Economy & minoring in Data Science; I like to read the news, watch YouTube videos, listen to rock and electronic music, mediate, lift weights, and do boxing in my free time. Hope you all will enjoy the course, and always feel free to reach out!

      + Staff | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

      Staff

      Jump to: Instructors, Teaching Assistants, Readers.

      Note: Consult the calendar for the most up-to-date office hours for each GSI. All GSI Office Hours will be held in Warren 101B.

      Course Staff Email

      Contact course staff via Ed with any questions or concerns. For sensitive matters, the staff email address data100.instructors@berkeley.edu is monitored by the instructors and a few lead TAs.

      Instructors

      Fernando Pérez

      Fernando Pérez

      He/Him/His

      fernando.perez@berkeley.edu

      Narges Norouzi

      Narges Norouzi

      She/Her/Hers

      norouzi@berkeley.edu

      Teaching Assistants

      Alan Jian

      Alan Jian

      He/Him/His

      alanjian131@berkeley.edu

      Office Hours: Mon, Wed 1-3

      Hi there, my name is Alan and I’m a 5th year MIDS student with a background in natural language processing and an interest in data engineering and data ethics. When I’m not doing data things, you’ll either find me playing tennis at the Hearst courts or curled up at home with a good book :)

      Bennett Somerville

      Bennett Somerville

      He/Him/His

      bdsomer@berkeley.edu

      Office Hours: Mon, Tue 1-3

      I’m a rising third-year undergraduate student majoring in computer science. I enjoy writing code, teaching, cycling, repairing bikes, playing music, and learning languages, among other things. Feel free to reach out!

      Celine Choi

      Celine Choi

      She/Her/Hers

      celinejwchoi@berkeley.edu

      Office Hours: Mon, Wed 1-3

      Hey everyone! I am a rising junior studying CS. This is my second year on course staff and I’m super stoked to meet you all :)

      Mihran Miroyan

      Mihran Miroyan

      He/Him/His

      miroyan.mihran@berkeley.edu

      Office Hours: Mon, Thu 3-5

      Hey, I am Mir!

      Milad Shafaie

      Milad Shafaie

      He/Him/His

      mshafaie@berkeley.edu

      Office Hours: Tue 4-5, Wed 3-5, Thu 1-2

      Hello

      Nathan Harounian

      Nathan Harounian

      He/Him/His

      nathanharounian@berkeley.edu

      Office Hours: Fri 12-4

      Hey! I’m a senior studying Statistics and Data Science. In my free time, I enjoy hanging out with my friends, listening to music, archery, and poker! I really enjoyed taking Data 100 last summer and look forward to helping y’all this summer :)

      Stephanie Xu

      Stephanie Xu

      She/Her/Hers

      stephanie.xu@berkeley.edu

      Office Hours: Mon 11-1, Tue 12-1, Wed 12-1

      Hi! I’m a CS and Data Science double major and I’m super excited to be one of your uGSIs! Feel free to reach out to me if you have any questions regarding the course or simply want someone to talk to!

      Tina Chen

      Tina Chen

      She/Her/Hers

      czz129@berkeley.edu

      Office Hours: Thu, Fri 1-3

      Hi Everyone! I’am Tina a rising senior majoring DS + stats. I’m super exicting to meet with everyone. Feel free to reach out to me for any questions! :)))

      Yash Dave

      Yash Dave

      He/Him/His

      yashdave003@berkeley.edu

      Office Hours: Mon 12-1, Tue 12-2, Wed 12-1

      Hi! I’m Yash, a rising junior majoring in Applied Math and CS with a minor in Public Policy. Excited to be teaching Data 100 over the summer!!

      Yuerou Tang

      Yuerou Tang

      They/Them/Theirs

      yuerou.tang@berkeley.edu

      Hi! I’m a senior studying CS and Conservation & Resource Studies. Check out my website for cool bird pictures I took!!

      Zaid Maayah

      Zaid Maayah

      He/Him/His

      zaidmaayah@berkeley.edu

      Office Hours: Tue, Thu 2-4

      Hi everyone! I’m a rising fourth-year international student from Jordan, double majoring in Data science and Linguistics. I like traveling, compiling playlists, and rating every restaurant in Berkeley. I hope you enjoy the course!

      Readers

      Aneesh Durai

      Aneesh Durai

      He/Him/His

      aneesh.durai@berkeley.edu

      Hi! I’m Aneesh, and I’m very excited to be working with you this summer!

      Anthony Zhang

      Anthony Zhang

      He/Him/His

      anthony_zhang1234@berkeley.edu

      yooo it’s anthony - im an expert in bonking on my bike, entering food coma, and tripping myself in dance dance revolution. i like to study quik mafs and cs

      Archer Parry

      Archer Parry

      He/Him/His

      archerp@berkeley.edu

      Hi, I am a rising senior that enjoys hanging out with friends and playing games in my free time.

      Asbah Wasim

      Asbah Wasim

      She/Her/Hers

      asbahwasim@berkeley.edu

      Hi there, welcome to Data 100! I am a rising junior studying Cognitive Science and Data Science. In my free time, I enjoy drawing nature, painting scenery, organizing, and going on walks. I look forward to meeting you over the summer, and hope you have a great time in the class!

      Hans Mao

      Hans Mao

      He/Him/His

      huanzhimao@berkeley.edu

      Hello! I’m a rising junior majoring in CS and Stat. I’m interested in computer security, distributed systems, and machine learning. I <3 Data 100! Besides teaching, I enjoy sailing, hiking, and swimming. Looking forward to an awesome semester :o (Generated by ChatGPT)

      Matthew Lee

      Matthew Lee

      He/Him/His

      matthewlee3@berkeley.edu

      hey i’m matthew and i like great vibes. please hit me up if you have a life changing restaurant.

      Yehchan Yoo

      Yehchan Yoo

      He/Him/His

      yehchanyoo@berkeley.edu

      Hello — I am a senior majoring in Statistics and Political Economy & minoring in Data Science; I like to read the news, watch YouTube videos, listen to rock and electronic music, mediate, lift weights, and do boxing in my free time. Hope you all will enjoy the course, and always feel free to reach out!

      diff --git a/_site/staffers/sheets_parser.json b/_site/staffers/sheets_parser.json deleted file mode 100644 index a6ea8e8..0000000 --- a/_site/staffers/sheets_parser.json +++ /dev/null @@ -1,13 +0,0 @@ -{ - "type": "service_account", - "project_id": "staff-page-389720", - "private_key_id": "207afa5f22bdb4a31c77ffd2ca548c6a85d5d7ac", - "private_key": "-----BEGIN PRIVATE KEY-----\nMIIEuwIBADANBgkqhkiG9w0BAQEFAASCBKUwggShAgEAAoIBAQC1qsb5ofN0+MpI\nR94G8KarUb3WwL4BZY7qKs3FhQdvU3rpi0rKsLjRbs3PHAFT9eUmDVvZau4otO4n\nAvD8rMOTsvmm4WmsfjPVv2ktN4xzVKubZWsTJKuzpDhMtG948jALMRCsLGJyM7SZ\nTX8VazEfzbxoE7eQhOY3z/TJG6zO8vjXb359Fq7TH957w0ruDDAv/Qt35Qn5Fzz2\ndmL9JHXbCc9iUoVvKNlTHDSj1D3tzAuHyWIijh6ucUBm/XWr/IN8fo4+lqyqAGBi\n72Cd7Ry085nFvqn7b6GA5KuF7sAM1gY3D4pNxuhQdmYVOcslhlaiYccpYIUrq7Eg\nO0gazfT/AgMBAAECgf9cQFzKZ3M58xzFl7knzQzV8qx0YWwbSXdJcnML2oHsBnhk\nIFfaleNEdwAMLCyAdl3m9OGvhp1qDnbhWJ0HsrOeTUR5ef4vmea4pHrEe3DXICgE\nwXuePQD0OHBeg0IYKOQ8yq2swN09IQSU1MW0GrrXa6JBN8H/oX1G2lNzzJn0fJCr\ns8Y1BUqwG+G1BRPx0DQ5EGVAOk38QlwvRntD7V654CTn7yIoSdz0LW515TG4jaZ7\nZPjeM4wRgBwYIYX4OijcJbIuYkes0kSqFRhpJR7q3ZZ5lSoOpi4uDNTs58q+ZOo4\noslHueDmC5ndnnonTHG7xPJrrkbEjuoykDLrqLECgYEA+FUYwav8tEZKzOoemD8x\nJXqN5DEJJF9yeSs7V7GlCkpRyjg2ckkSCHY4gQ8vkKZeJflBGypP1yAHF3ZTMvQr\neTGLJxNh1V2kenJjC4Lrcy1P2/BsmNUR4SIqGScQzWbdGWRPp8DmF8+VlFByfpVn\n+2v1GpGhdMa8NQhAbPfhDysCgYEAu0a8QucquCuNDf4lHw+P6yE2zBJufsfLeBbH\nhFKR3H6DG0GWFug2SII5lsFKxapjUct9iWgl1M9OPW44zF25J6jenakUbNf5jF4i\nd5SgH4+LHaexTO+YXEak4yg+/yeTMoDtKZufhHFGPEhIl9dz00XB+vzpA7IPng0x\nNrzOJ30CgYEA7m5mEq3bOAu1jgHL1kn2GhINYmdia7Xo50YG+C/sUnEBDrPiMuDN\nm6pGnkPCW5QhGTy0sixx9A8gP/qv72BYzUgwXxhQ+teqMJbbWhYdkrySzI2O9z68\np/hxiyzjCRQWfWa+xEaFpZ798yU6iSdSayhAcX4aE1EtK438raNiR3kCgYB2VDZl\ny2xZm+LvQXKxEoMr3Pujq823O4RbZ4E/IXDaMfGjCijMZoLOA8Jhd9ZH2OYSa5Hx\nfSXSNf5IoFkw/9MatP+b/JZUQ46A24XJqtYVuvv6i9diNk09mMFcajSLwbSnB4FS\ndesvoubu9fkwP8kGaCAt9xk/5YUqp0k+PcPAfQKBgHtj16Z8H1S+gNk1/0kQ1Un0\nPgqGtoDOiONJ8QmIAHQ3HNBcYX79BohOVVuYUZTbwZ8Yxr4X980c83FBE1P1XG8p\nUnW0GyghzrvQsCZHKP6El4F4aOKF2MLoMs1irXv5W4c2UV1i7K3Kjk+24Joh49kq\nfFD3GCcYd01uyVLZauZp\n-----END PRIVATE KEY-----\n", - "client_email": "data100-staff-page@staff-page-389720.iam.gserviceaccount.com", - "client_id": "108023473760832906636", - "auth_uri": "https://accounts.google.com/o/oauth2/auth", - "token_uri": "https://oauth2.googleapis.com/token", - "auth_provider_x509_cert_url": "https://www.googleapis.com/oauth2/v1/certs", - "client_x509_cert_url": "https://www.googleapis.com/robot/v1/metadata/x509/data100-staff-page%40staff-page-389720.iam.gserviceaccount.com", - "universe_domain": "googleapis.com" -} diff --git a/_site/syllabus/index.html b/_site/syllabus/index.html index 2a9b015..62b8eab 100644 --- a/_site/syllabus/index.html +++ b/_site/syllabus/index.html @@ -1 +1 @@ - Syllabus | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

      Syllabus

      Jump to:


      About Data 100

      Combining data, computation, and inferential thinking, data science is redefining how people and organizations solve challenging problems and understand their world. This intermediate level class bridges between Data 8 and upper division computer science and statistics courses as well as methods courses in other fields. In this class, we explore key areas of data science including question formulation, data collection and cleaning, visualization, statistical inference, predictive modeling, and decision making.​ Through a strong emphasis on data centric computing, quantitative critical thinking, and exploratory data analysis, this class covers key principles and techniques of data science. These include languages for transforming, querying and analyzing data; algorithms for machine learning methods including regression, classification and clustering; principles behind creating informative data visualizations; statistical concepts of measurement error and prediction; and techniques for scalable data processing.

      Goals

      • Prepare students for advanced Berkeley courses in data-management, machine learning, and statistics, by providing the necessary foundation and context.
      • Enable students to start careers as data scientists by providing experience working with real-world data, tools, and techniques.
      • Empower students to apply computational and inferential thinking to address real-world problems.

      Prerequisites

      While we are working to make this class widely accessible, we currently require the following (or equivalent) prerequisites. Prerequisites will be enforced in Data 100. It is your responsibility to know the material in the prerequisites. The instructors do not have the authority to waive these requirements. Undergraduates should fill out the Enrollment Exception Form managed by CDSS to request an exception.

      • Foundations of Data Science: Data 8 covers much of the material in Data 100 but at an introductory level. Data 8 provides basic exposure to python programming and working with tabular data as well as visualization, statistics, and machine learning.

      • Computing: The Structure and Interpretation of Computer Programs (CS 61A) or Computational Structures in Data Science (Data 88C). These courses provide additional background in python programming (e.g., for loops, lambdas, debugging, and complexity) that will enable Data 100 to focus more on the concepts in Data Science and less on the details of programming in python.

      • Math: Linear Algebra (Math 54, EECS 16A, Math 91, Math 110, or Stat 89A). We will need some basic concepts like linear operators, eigenvectors, derivatives, and integrals to enable statistical inference and derive new prediction algorithms. This may be satisfied concurrently to Data 100.

      Please consult the Resources page for additional resources for reviewing prerequisite material.

      Textbook: There is no official textbook for Data 100 this semester; we will provide course notes that will be released with the respective lectures.

      Course Culture

      Students taking Data C100 come from a wide range of backgrounds. We hope to foster an inclusive and safe learning environment based on curiosity rather than competition. All members of the course community — the instructors, students, and course staff — are expected to treat each other with courtesy and respect. Some of the responsibility for that lies with the staff, but a lot of it ultimately rests with you, the students.

      Be Aware of Your Actions

      Sometimes, the little things add up to creating an unwelcoming culture to some students. For example, you and a friend may think you are sharing in a private joke about other races, majors, genders, abilities, cultures, etc. but this can have adverse effects on classmates who overhear it. There is a great deal of research on something called “stereotype threat”: research finds that simply reminding someone that they belong to a particular culture or share a particular identity (on whatever dimension) can interfere with their course performance.

      Stereotype threat works both ways: you can assume that a student will struggle based on who they appear to be, or you can assume that a student is doing great based on who they appear to be. Both are potentially harmful.

      Bear in mind that diversity has many facets, some of which are not visible. Your classmates may have medical conditions (physical or mental), personal situations (financial, family, etc.), or interests that aren’t common to most students in the course. Another aspect of professionalism is avoiding comments that (likely unintentionally) put down colleagues for situations they cannot control. Bragging in open space that an assignment is easy or “crazy,” for example, can send subtle cues that discourage classmates who are dealing with issues that you can’t see. Please take care, so we can create a class in which all students feel supported and respected.

      Be Respectful

      Beyond the slips that many of us make unintentionally are a host of behaviors that the course staff, department, and university do not tolerate. These are generally classified under the term harassment; sexual harassment is a specific form that is governed by federal laws known as Title IX.

      UC Berkeley’s Title IX website provides many resources for understanding the terms, procedures, and policies around harassment. Make sure you are aware enough of these issues to avoid crossing a line in your interactions with other students. For example, repeatedly asking another student out on a date after they have said no can cross this line.

      Your reaction to this topic might be to laugh it off, or to make or think snide remarks about “political correctness” or jokes about consent or other things. You might think people just need to grow a thicker skin or learn to take a joke. This isn’t your decision to make. Research shows the consequences (emotional as well as physical) on people who experience harassment. When your behavior forces another student to focus on something other than their education, you have crossed a line. You have no right to take someone else’s education away from them.

      Communicate Issues with Course Staff and/or the Department

      We take all complaints about unprofessional or discriminatory behavior seriously. Professionalism and respect for diversity are not just matters between students; they also apply to how the course staff treat the students. The staff of this course will treat you in a way that respects our differences. However, despite our best efforts, we might slip up, hopefully inadvertently. If you are concerned about classroom environment issues created by the staff or overall class dynamic, please feel free to talk to us about it. The instructors in particular welcome any comments or concerns regarding conduct of the course and the staff. See below for how to best reach us.

      From the Data Science Department: Data Science Undergraduate Studies faculty and staff are committed to creating a community where every person feels respected, included, and supported. We recognize that incidents may happen, sometimes unintentionally, that run counter to this goal. There are many things we can do to try to improve the climate for students, but we need to understand where the challenges lie. If you experience a remark, or disrespectful treatment, or if you feel you are being ignored, excluded or marginalized in a course or program-related activity, please speak up. Consider talking to your instructor, but you are also welcome to contact Executive Director Christina Teller at cpteller@berkeley.edu or report an incident anonymously through this online form.

      As course staff, we are committed to creating a learning environment welcoming of all students that supports a diversity of thoughts, perspectives and experiences and respects your identities and backgrounds (including race, ethnicity, nationality, gender identity, socioeconomic class, sexual orientation, language, religion, ability, and more.) To help accomplish this:

      • If your name and/or pronouns differ from those that appear in your official records, please let us know.
      • If you feel like your performance in the class is being affected by your experiences outside of class (e.g., family matters, current events), please don’t hesitate to come and talk with us. We want to be resources for you.
      • We (like many people) are still in the process of learning about diverse perspectives and identities. If something was said in class (by anyone) that made you feel uncomfortable, please talk to us about it.
      • While the course staff understands that improving diversity, equity, and inclusion (DEI) are not enough to overcome systemic issues in academia such as racism, queerphobia, and other forms of discrimination and hatred, we also recognize the importance of DEI work.
      • If there are other resources you think we should list here, let us know!

      Course Delivery

      In keeping with departmental guidelines set by the Division of Computing, Data Science, and Society, all Data Science courses at Berkeley are offered fully in-person in Summer 2023. This summer’s offering of Data 100 will be taught solely in-person.

      If you are unable to attend in-person discussion sections and office hours this summer, you are strongly encouraged to consider taking a different course. If you are unable to attend the in-person Midterm and Final, you cannot take Data 100 in Summer 2023.

      Course Components

      Below is a high-level “typical week in the course” for Summer 2023.

      Mo Tu We Th Fr Sat
      Office Hours Office Hours Office Hours Office Hours Office Hours  
      Live Lecture Live Lecture Live Lecture Live Lecture    
      Discussion Section   Discussion Section   Exam Prep/Catch-Up  
      Homework due     Homework due    
                2 Labs due
      • All deadlines are subject to change.
      • Office Hours are scheduled on the Calendar page.
      • Lectures, discussions, assignments, projects, and exams are scheduled on the Home page.

      Lecture

      There are 4 live lectures held Mondays to Thursdays, 5:00 pm - 6:30 pm, in-person in Li Ka Shing 245. All lecture recordings, slides, activities, and examples will be provided to the course website within 24 hours of the lecture.

      Discussion

      Live discussion sections are one hour long sessions held twice weekly on Mondays and Wednesdays. The goal of these GSI-led sessions is to work through problems, hone your skills, and flesh out your understanding as part of a team. The problems that you solve and present as part of discussion are important in understanding course material.

      The lectures, assignments, and exams of this course are structured with the expectation that all students attend discussion. The content covered in these sections is designed to solidify understanding of key lecture concepts and prepare students for homework assignments. It is to your benefit to actively participate in all discussions!

      • Discussion attendance will be recorded each week and account for 5% of the overall grade
      • All students are automatically granted 3 discussion drops to use for illness, personal emergencies, or other extenuating circumstances. These drops are designed to account for unexpected events – you should not plan to use them!
      • Attending the exam-prep session on Friday can replace either a missed Monday or a missed Wednesday section only for that specific week. Details about exam-prep sections will be released in the second week of classes.
      • Students with low discussion attendance scores may alternatively shift this 5% of the course grade onto their homework score. Course staff will automatically determine which grading policy will maximize your final grade in the course at the end of the semester.

      You will be invited to share your timing preferences for discussions and assigned to a section in the first week of classes.

      Homework and Projects

      Homeworks are half-week-long assignments designed to help students develop an in-depth understanding of both the theoretical and practical aspects of ideas presented in lecture. Projects are week-long assignments (with a half-week checkpoint) that synthesize multiple topics. Typically, assignments will be due at 11:59 pm on Mondays and Thursdays.

      • All homeworks and projects must be submitted to Gradescope by their posted deadlines.
        • Each assignment will include detailed instructions on how to submit your work for grading. It is the student’s responsibility to read these carefully and ensure that their work is submitted correctly. Assignment accommodations will not be granted in cases where students have mis-submitted their work (for example, by submitting to the wrong portal, submitting only part of an assignment, forgetting to select pages, or failing to pass autograder tests)
      • Homeworks and projects have both visible and hidden autograder tests. The visible tests are mainly sanity checks. For example, a sanity check might verify that the answer you entered is a number as expected, and not a word. The hidden tests generally check for correctness, and are invisible to students while they are doing the assignment.
      • The primary form of support students will have for homeworks and projects are office hours and Ed.
      • Homeworks and projects must be completed individually. See the Collaboration Policy for more details.
      • See the Policies section for the submission grace period.

      Lab

      Labs are shorter programming assignments designed to give students familiarity with new ideas. They are meant to be completed prior to homework.

      Two lab assignments will be released at the start of each week, covering content that will be presented in that week’s lectures. The first of these two assignments will cover the content presented in Monday’s and Tuesday’s lectures; the second will cover the content presented in Wednesday’s and Thursday’s lectures. Both weekly lab assignments are due at 11:59 pm on the Saturday of the corresponding week.

      • All lab assignments must be submitted to Gradescope by their posted deadlines.
      • All lab autograder tests are visible. Receiving full points on the autograder guarantees that you will be awarded full points on the lab assignment.
      • All lab assignments will be accompanied by a video walkthrough with explanations of key concepts. There will be no synchronous lab sections, however, students are welcome to bring questions about lab to office hours.
      • All labs are intended to take about an hour.

      Exams

      There will be two exams in this course:

      • Midterm on Thursday, July 20 5-7 PM.
      • Final on Thursday, August 10 5-7 PM.

      All exams must be taken in-person. There will be one alternate final exam on August 10 6:30-8:30PM.

      Office Hours and Communication

      We want to enable everyone to succeed in this course. We encourage you to discuss course content with your friends, classmates, and course staff throughout the semester, particularly during office hours.

      • All office hours are listed on the Calendar.
      • GSI office hours will be held in Warren Hall 101B.
      • In general, students can come to GSI office hours for any questions on course assignments or material.
      • Instructor office hours are generally reserved for conceptual questions, course review, or course logistics.

      Course Communication:

      • EdStem, or Ed for short, is our course forum this semester. The course is here. All course announcements will be through Ed. We are not using bCourses this semester. Please check out Ed or the FAQ page first before emailing course staff directly.

      Ed is your primary platform for asking questions about the class. It is monitored daily by the entire course staff, so questions posted to Ed will likely receive the fastest response. If you need to discuss a more sensitive matter, the following emails are monitored by a smaller subset of the teaching team:

      Policies

      Grading Scheme

      Category Percentage Details
      Homeworks 25% Drop lowest
      Projects 15% No drop
      Labs 10% Drop 2 lowest scores
      Discussion 5% Drop 3 lowest scores
      Midterm Exam 15%  
      Final Exam 30%  

      Discussion attendance is expected for the summer session. Students with low discussion attendance scores may alternatively shift this 5% of the course grade onto their homework score, such that homework is worth 30% of the overall grade. Course staff will automatically apply whichever grading policy will maximize your final grade in the course at the end of the semester.

      On-Time Submission

      All assignments are due at 11:59 PM Pacific Time on the due date specified on the Home / Schedule page. The date and time of this deadline are firm. Submitting even a minute past is considered late.

      Submitting by this “on-time” deadline earns an extra-credit on-time bonus, a 3% perk. This is available for homeworks, projects, and labs.

      Grace Period

      We recognize that life can be unexpected, and that you may face circumstances that prevent you from submitting your work by the posted deadline. In light of this, we offer a 1-day (24 hour) grace period for late submissions of homeworks, projects, and labs. Note that this grace period is designed to account for unexpected emergencies or assignment submission errors – you should not plan in advance to use it!

      You can make a late submission after the on-time deadline and up to the end of the grace period. These late submissions are not penalized, but do not earn 3% the on-time bonus. You do not need to explicitly contact staff about late submissions; just submit directly to Gradescope within the listed grace period.

      Submissions are not accepted beyond the grace period. The grace period is strictly enforced. We recommend thinking of the grace period as a backup, in case something unexpected comes up when aiming for the on-time deadline. As a result, getting an extension beyond the grace period will generally not be granted, except in rare, extraordinary emergencies (see the Extenuating Circumstances section).

      All official communication will refer to the on-time deadline as the expected dates that you will submit assignments.

      Extenuating Circumstances

      We recognize that our students come from varied backgrounds and have widely-varying experiences. If you encounter extenuating circumstances at any time in the semester, please do not hesitate to let us know. The sooner we are made aware, the more options we have available to us to help you.

      The Extenuating Circumstances Form is for any circumstances that cannot be resolved via the grace period policy above. Within two business days of filling out the form, a course staff will reach out to you and provide a space for conversation, as well as to arrange course/grading accommodations as necessary. For more information, please email data100.support@berkeley.edu.

      We recognize that at times, it can be difficult to manage your course performance — particularly in such a huge course, and particularly at Berkeley’s high standards. Sometimes emergencies just come up (personal health emergency, family emergency, etc.). Our Grace Period Policy combined with the Extenuating Circumstances Form is meant to lower the barrier to reaching out to us, as well as build your independence in managing your academic career long-term. So please do not hesitate to reach out.

      Note that extenuating circumstances do not extend to logistical oversight, such as Datahub/Gradescope tests not passing, submitting only one portion of the homework, forgetting to save your notebook before exporting, submitting to the wrong assignment portal, or not properly tagging pages on Gradescope. It is the student’s responsibility to identify and resolve these issues in advance of the on-time deadline. We will not grant accommodations for these cases; instead, please use the grace period to cushion these submission errors.

      DSP Accommodations

      If you are registered with the Disabled Students’ Program (DSP) you can expect to receive an email from us during the first week of classes confirming your accommodations. Otherwise, email our support email. DSP students who receive approved assignment accommodations will have the 1-day grace period added to the approved extension to the on-time deadline. Please note that any extension, plus the grace period combined, cannot exceed 5 days. DSP students can submit assignment extension accommodation requests via the Extenuating Circumstances Form.

      You are responsible for reasonable communication with course staff. If you make a request close to the deadline, we can not guarantee that you will receive a response before the deadline. Additionally, simply submitting a request does not guarantee you will receive an extension. Even if your work is incomplete, please submit before the deadline so you can receive credit for the work you did complete.

      Regrade Requests

      Students will be allowed to submit regrade requests for the autograded and written portions of assignments in cases in which the rubric was incorrectly applied or the autograder scored their submission incorrectly. Regrades for the written portions of assignments will be handled through Gradescope, and autograder regrades via a Google Form. The deadline for regrade requests (autograded and written) is one week after the grades are released for the corresponding assignment.

      Always check that the autograder executes correctly! Gradescope will show you the output of the public tests, and you should see the same results as you did on DataHub. If you see a discrepancy, ensure that you have exported the assignment correctly and, if there is still an issue, post on Ed as soon as possible.

      Regrade requests will not be considered in cases in which:

      • a student uploads the incorrect file to the autograder.
      • the autograder fails to execute and the student does not notify the course staff before the assignment deadline.
      • a student fails to save their notebook before exporting and uploads an old version to the autograder.
      • a situation arises in which the course staff cannot ensure that the student’s work was done before the assignment deadline.

      Collaboration Policy and Academic Honesty

      We will be following the EECS departmental policy on Academic Honesty, which states that using work or resources that are not your own or not permitted by the course may lead to disciplinary actions, including a failing grade in the course.

      Assignments. Data science is a collaborative activity. While you may talk with others about the homework and projects, we ask that you write your solutions individually in your own words. If you do discuss the assignments with others please include their names at the top of your notebook. Restated, you and your friends are encouraged to discuss course content and approaches to problem-solving, but you are not allowed to share your code nor answers with other students, nor are you allowed to post your assignment solutions publicly. Doing so is considered academic misconduct. We will be running advanced plagiarism detection programs on all assignments. Use of AI-assisted methods, such as ChatGPT, to generate written or code solutions to assignments is prohibited.

      Exams. Cheating on exams is a serious offense. We have methods of detecting cheating on exams – so don’t do it! Students caught cheating on any exam will fail this course.

      Plagiarism on any assignment, as well as other violations to Berkeley’s Code of Conduct, will be reported to the Center for Student Conduct. The CSC treats most first-time offenses as a Non-Reportable Warning. Additionally we reserve the right to give you a negative full score (-100%) or lower on the assignments in question, an F in the course, or even dismissal from the university. It’s just not worth it!

      Rather than copying someone else’s work, ask for help. You are not alone in Data 100! The entire staff is here to help you succeed. We expect that you will work with integrity and with respect for other members of the class, just as the course staff will work with integrity and with respect for you.

      Finally, know that it’s normal to struggle. Berkeley has high standards, which is one of the reasons its degrees are valued. Everyone struggles, even though many try not to show it. Even if you don’t learn everything that’s being covered, you’ll be able to build on what you do learn, whereas if you cheat you’ll have nothing to build on. You aren’t expected to be perfect; it’s ok not to get an A.

      Academic and Wellness Resources

      Our Resources page lists not only course-specific academic resources such as course notes, past exams, study guides, and prerequisite review links, but also campus wellness resources on COVID-19, academic support, technology support, mental well-being, DSP accommodations, dispute resolution, social services, campus community, and basic needs. Our staff will also refer to this page when supporting you through this course.

      We want you to succeed!

      If you are feeling overwhelmed, visit our office hours and talk with us, or fill out the Extenuating Circumstances Form. We know college can be stressful and we want to help you succeed.

      Important Note: We are committed to being a resource to you, but it is important to note that all members of the teaching staff for this course are responsible employees, meaning that we must disclose any incidents of sexual harassment or violence to campus authorities. If you would like to speak to a confidential advocate, please consider reaching out to the Berkeley PATH to Care Center.

      Finally, the main goal of this course is that you should learn, and have a fantastic experience doing so. Please keep that goal in mind throughout the semester. Welcome to Data 100!

      Acknowledgments

      Academic Honesty policy and closing words adapted from Data 8. Course Culture inspired and adapted with permission from Dr. Sarah Chasins’ Fall 2021 CS 164 Syllabus and Grace O’Connell, the Asssociate Dean for Inclusive Excellence.

      + Syllabus | Data 100 Skip to main content Link Menu Expand (external link) Document Search Copy Copied

      Syllabus

      Jump to:


      About Data 100

      Combining data, computation, and inferential thinking, data science is redefining how people and organizations solve challenging problems and understand their world. This intermediate level class bridges between Data 8 and upper division computer science and statistics courses as well as methods courses in other fields. In this class, we explore key areas of data science including question formulation, data collection and cleaning, visualization, statistical inference, predictive modeling, and decision making.​ Through a strong emphasis on data centric computing, quantitative critical thinking, and exploratory data analysis, this class covers key principles and techniques of data science. These include languages for transforming, querying and analyzing data; algorithms for machine learning methods including regression, classification and clustering; principles behind creating informative data visualizations; statistical concepts of measurement error and prediction; and techniques for scalable data processing.

      Goals

      • Prepare students for advanced Berkeley courses in data-management, machine learning, and statistics, by providing the necessary foundation and context.
      • Enable students to start careers as data scientists by providing experience working with real-world data, tools, and techniques.
      • Empower students to apply computational and inferential thinking to address real-world problems.

      Prerequisites

      While we are working to make this class widely accessible, we currently require the following (or equivalent) prerequisites. Prerequisites will be enforced in Data 100. It is your responsibility to know the material in the prerequisites. The instructors do not have the authority to waive these requirements. Undergraduates should fill out the Enrollment Exception Form managed by CDSS to request an exception.

      • Foundations of Data Science: Data 8 covers much of the material in Data 100 but at an introductory level. Data 8 provides basic exposure to python programming and working with tabular data as well as visualization, statistics, and machine learning.

      • Computing: The Structure and Interpretation of Computer Programs (CS 61A) or Computational Structures in Data Science (Data 88C). These courses provide additional background in python programming (e.g., for loops, lambdas, debugging, and complexity) that will enable Data 100 to focus more on the concepts in Data Science and less on the details of programming in python.

      • Math: Linear Algebra (Math 54, EECS 16A, Math 91, Math 110, or Stat 89A). We will need some basic concepts like linear operators, eigenvectors, derivatives, and integrals to enable statistical inference and derive new prediction algorithms. This may be satisfied concurrently to Data 100.

      Please consult the Resources page for additional resources for reviewing prerequisite material.

      Textbook: There is no official textbook for Data 100 this semester; we will provide course notes that will be released with the respective lectures.

      Course Culture

      Students taking Data C100 come from a wide range of backgrounds. We hope to foster an inclusive and safe learning environment based on curiosity rather than competition. All members of the course community — the instructors, students, and course staff — are expected to treat each other with courtesy and respect. Some of the responsibility for that lies with the staff, but a lot of it ultimately rests with you, the students.

      Be Aware of Your Actions

      Sometimes, the little things add up to creating an unwelcoming culture to some students. For example, you and a friend may think you are sharing in a private joke about other races, majors, genders, abilities, cultures, etc. but this can have adverse effects on classmates who overhear it. There is a great deal of research on something called “stereotype threat”: research finds that simply reminding someone that they belong to a particular culture or share a particular identity (on whatever dimension) can interfere with their course performance.

      Stereotype threat works both ways: you can assume that a student will struggle based on who they appear to be, or you can assume that a student is doing great based on who they appear to be. Both are potentially harmful.

      Bear in mind that diversity has many facets, some of which are not visible. Your classmates may have medical conditions (physical or mental), personal situations (financial, family, etc.), or interests that aren’t common to most students in the course. Another aspect of professionalism is avoiding comments that (likely unintentionally) put down colleagues for situations they cannot control. Bragging in open space that an assignment is easy or “crazy,” for example, can send subtle cues that discourage classmates who are dealing with issues that you can’t see. Please take care, so we can create a class in which all students feel supported and respected.

      Be Respectful

      Beyond the slips that many of us make unintentionally are a host of behaviors that the course staff, department, and university do not tolerate. These are generally classified under the term harassment; sexual harassment is a specific form that is governed by federal laws known as Title IX.

      UC Berkeley’s Title IX website provides many resources for understanding the terms, procedures, and policies around harassment. Make sure you are aware enough of these issues to avoid crossing a line in your interactions with other students. For example, repeatedly asking another student out on a date after they have said no can cross this line.

      Your reaction to this topic might be to laugh it off, or to make or think snide remarks about “political correctness” or jokes about consent or other things. You might think people just need to grow a thicker skin or learn to take a joke. This isn’t your decision to make. Research shows the consequences (emotional as well as physical) on people who experience harassment. When your behavior forces another student to focus on something other than their education, you have crossed a line. You have no right to take someone else’s education away from them.

      Communicate Issues with Course Staff and/or the Department

      We take all complaints about unprofessional or discriminatory behavior seriously. Professionalism and respect for diversity are not just matters between students; they also apply to how the course staff treat the students. The staff of this course will treat you in a way that respects our differences. However, despite our best efforts, we might slip up, hopefully inadvertently. If you are concerned about classroom environment issues created by the staff or overall class dynamic, please feel free to talk to us about it. The instructors in particular welcome any comments or concerns regarding conduct of the course and the staff. See below for how to best reach us.

      From the Data Science Department: Data Science Undergraduate Studies faculty and staff are committed to creating a community where every person feels respected, included, and supported. We recognize that incidents may happen, sometimes unintentionally, that run counter to this goal. There are many things we can do to try to improve the climate for students, but we need to understand where the challenges lie. If you experience a remark, or disrespectful treatment, or if you feel you are being ignored, excluded or marginalized in a course or program-related activity, please speak up. Consider talking to your instructor, but you are also welcome to contact Executive Director Christina Teller at cpteller@berkeley.edu or report an incident anonymously through this online form.

      As course staff, we are committed to creating a learning environment welcoming of all students that supports a diversity of thoughts, perspectives and experiences and respects your identities and backgrounds (including race, ethnicity, nationality, gender identity, socioeconomic class, sexual orientation, language, religion, ability, and more.) To help accomplish this:

      • If your name and/or pronouns differ from those that appear in your official records, please let us know.
      • If you feel like your performance in the class is being affected by your experiences outside of class (e.g., family matters, current events), please don’t hesitate to come and talk with us. We want to be resources for you.
      • We (like many people) are still in the process of learning about diverse perspectives and identities. If something was said in class (by anyone) that made you feel uncomfortable, please talk to us about it.
      • While the course staff understands that improving diversity, equity, and inclusion (DEI) are not enough to overcome systemic issues in academia such as racism, queerphobia, and other forms of discrimination and hatred, we also recognize the importance of DEI work.
      • If there are other resources you think we should list here, let us know!

      Course Delivery

      In keeping with departmental guidelines set by the Division of Computing, Data Science, and Society, all Data Science courses at Berkeley are offered fully in-person in Summer 2023. This summer’s offering of Data 100 will be taught solely in-person.

      If you are unable to attend in-person discussion sections and office hours this summer, you are strongly encouraged to consider taking a different course. If you are unable to attend the in-person Midterm and Final, you cannot take Data 100 in Summer 2023.

      Course Components

      Below is a high-level “typical week in the course” for Summer 2023.

      Mo Tu We Th Fr Sat
      Office Hours Office Hours Office Hours Office Hours Office Hours  
      Live Lecture Live Lecture Live Lecture Live Lecture    
      Discussion Section   Discussion Section   Exam Prep/Catch-Up  
      Homework due     Homework due    
                2 Labs due
      • All deadlines are subject to change.
      • Office Hours are scheduled on the Calendar page.
      • Lectures, discussions, assignments, projects, and exams are scheduled on the Home page.

      Lecture

      There are 4 live lectures held Mondays to Thursdays, 5:00 pm - 6:30 pm, in-person in Li Ka Shing 245. All lecture recordings, slides, activities, and examples will be provided to the course website within 24 hours of the lecture.

      Discussion

      Live discussion sections are one hour long sessions held twice weekly on Mondays and Wednesdays. The goal of these GSI-led sessions is to work through problems, hone your skills, and flesh out your understanding as part of a team. The problems that you solve and present as part of discussion are important in understanding course material.

      The lectures, assignments, and exams of this course are structured with the expectation that all students attend discussion. The content covered in these sections is designed to solidify understanding of key lecture concepts and prepare students for homework assignments. It is to your benefit to actively participate in all discussions!

      • Discussion attendance will be recorded each week and account for 5% of the overall grade
      • All students are automatically granted 3 discussion drops to use for illness, personal emergencies, or other extenuating circumstances. These drops are designed to account for unexpected events – you should not plan to use them!
      • Attending the exam-prep session on Friday can replace either a missed Monday or a missed Wednesday section only for that specific week. Details about exam-prep sections will be released in the second week of classes.
      • Students with low discussion attendance scores may alternatively shift this 5% of the course grade onto their homework score. Course staff will automatically determine which grading policy will maximize your final grade in the course at the end of the semester.

      You will be invited to share your timing preferences for discussions and assigned to a section in the first week of classes.

      Homework and Projects

      Homeworks are half-week-long assignments designed to help students develop an in-depth understanding of both the theoretical and practical aspects of ideas presented in lecture. Projects are week-long assignments (with a half-week checkpoint) that synthesize multiple topics. Typically, assignments will be due at 11:59 pm on Mondays and Thursdays.

      • All homeworks and projects must be submitted to Gradescope by their posted deadlines.
        • Each assignment will include detailed instructions on how to submit your work for grading. It is the student’s responsibility to read these carefully and ensure that their work is submitted correctly. Assignment accommodations will not be granted in cases where students have mis-submitted their work (for example, by submitting to the wrong portal, submitting only part of an assignment, forgetting to select pages, or failing to pass autograder tests)
      • Homeworks and projects have both visible and hidden autograder tests. The visible tests are mainly sanity checks. For example, a sanity check might verify that the answer you entered is a number as expected, and not a word. The hidden tests generally check for correctness, and are invisible to students while they are doing the assignment.
      • The primary form of support students will have for homeworks and projects are office hours and Ed.
      • Homeworks and projects must be completed individually. See the Collaboration Policy for more details.
      • See the Policies section for the submission grace period.

      Lab

      Labs are shorter programming assignments designed to give students familiarity with new ideas. They are meant to be completed prior to homework.

      Two lab assignments will be released at the start of each week, covering content that will be presented in that week’s lectures. The first of these two assignments will cover the content presented in Monday’s and Tuesday’s lectures; the second will cover the content presented in Wednesday’s and Thursday’s lectures. Both weekly lab assignments are due at 11:59 pm on the Saturday of the corresponding week.

      • All lab assignments must be submitted to Gradescope by their posted deadlines.
      • All lab autograder tests are visible. Receiving full points on the autograder guarantees that you will be awarded full points on the lab assignment.
      • All lab assignments will be accompanied by a video walkthrough with explanations of key concepts. There will be no synchronous lab sections, however, students are welcome to bring questions about lab to office hours.
      • All labs are intended to take about an hour.

      Exams

      There will be two exams in this course:

      • Midterm on Thursday, July 20 5-7 PM.
      • Final on Thursday, August 10 5-7 PM.

      All exams must be taken in-person. There will be one alternate final exam on August 10 6:30-8:30PM.

      Office Hours and Communication

      We want to enable everyone to succeed in this course. We encourage you to discuss course content with your friends, classmates, and course staff throughout the semester, particularly during office hours.

      • All office hours are listed on the Calendar.
      • GSI office hours will be held in Warren Hall 101B.
      • In general, students can come to GSI office hours for any questions on course assignments or material.
      • Instructor office hours are generally reserved for conceptual questions, course review, or course logistics.

      Course Communication:

      • EdStem, or Ed for short, is our course forum this semester. The course is here. All course announcements will be through Ed. We are not using bCourses this semester. Please check out Ed or the FAQ page first before emailing course staff directly.

      Ed is your primary platform for asking questions about the class. It is monitored daily by the entire course staff, so questions posted to Ed will likely receive the fastest response. If you need to discuss a more sensitive matter, the following emails are monitored by a smaller subset of the teaching team:

      Policies

      Grading Scheme

      Category Percentage Details
      Homeworks 25% Drop lowest
      Projects 15% No drop
      Labs 10% Drop 2 lowest scores
      Discussion 5% Drop 3 lowest scores
      Midterm Exam 15%  
      Final Exam 30%  

      Discussion attendance is expected for the summer session. Students with low discussion attendance scores may alternatively shift this 5% of the course grade onto their homework score, such that homework is worth 30% of the overall grade. Course staff will automatically apply whichever grading policy will maximize your final grade in the course at the end of the semester.

      On-Time Submission

      All assignments are due at 11:59 PM Pacific Time on the due date specified on the Home / Schedule page. The date and time of this deadline are firm. Submitting even a minute past is considered late.

      Submitting by this “on-time” deadline earns an extra-credit on-time bonus, a 3% perk. This is available for homeworks, projects, and labs.

      Grace Period

      We recognize that life can be unexpected, and that you may face circumstances that prevent you from submitting your work by the posted deadline. In light of this, we offer a 1-day (24 hour) grace period for late submissions of homeworks, projects, and labs. Note that this grace period is designed to account for unexpected emergencies or assignment submission errors – you should not plan in advance to use it!

      You can make a late submission after the on-time deadline and up to the end of the grace period. These late submissions are not penalized, but do not earn 3% the on-time bonus. You do not need to explicitly contact staff about late submissions; just submit directly to Gradescope within the listed grace period.

      Submissions are not accepted beyond the grace period. The grace period is strictly enforced. We recommend thinking of the grace period as a backup, in case something unexpected comes up when aiming for the on-time deadline. As a result, getting an extension beyond the grace period will generally not be granted, except in rare, extraordinary emergencies (see the Extenuating Circumstances section).

      All official communication will refer to the on-time deadline as the expected dates that you will submit assignments.

      Extenuating Circumstances

      We recognize that our students come from varied backgrounds and have widely-varying experiences. If you encounter extenuating circumstances at any time in the semester, please do not hesitate to let us know. The sooner we are made aware, the more options we have available to us to help you.

      The Extenuating Circumstances Form is for any circumstances that cannot be resolved via the grace period policy above. Within two business days of filling out the form, a course staff will reach out to you and provide a space for conversation, as well as to arrange course/grading accommodations as necessary. For more information, please email data100.support@berkeley.edu.

      We recognize that at times, it can be difficult to manage your course performance — particularly in such a huge course, and particularly at Berkeley’s high standards. Sometimes emergencies just come up (personal health emergency, family emergency, etc.). Our Grace Period Policy combined with the Extenuating Circumstances Form is meant to lower the barrier to reaching out to us, as well as build your independence in managing your academic career long-term. So please do not hesitate to reach out.

      Note that extenuating circumstances do not extend to logistical oversight, such as Datahub/Gradescope tests not passing, submitting only one portion of the homework, forgetting to save your notebook before exporting, submitting to the wrong assignment portal, or not properly tagging pages on Gradescope. It is the student’s responsibility to identify and resolve these issues in advance of the on-time deadline. We will not grant accommodations for these cases; instead, please use the grace period to cushion these submission errors.

      DSP Accommodations

      If you are registered with the Disabled Students’ Program (DSP) you can expect to receive an email from us during the first week of classes confirming your accommodations. Otherwise, email our support email. DSP students who receive approved assignment accommodations will have the 1-day grace period added to the approved extension to the on-time deadline. Please note that any extension, plus the grace period combined, cannot exceed 5 days. DSP students can submit assignment extension accommodation requests via the Extenuating Circumstances Form.

      You are responsible for reasonable communication with course staff. If you make a request close to the deadline, we can not guarantee that you will receive a response before the deadline. Additionally, simply submitting a request does not guarantee you will receive an extension. Even if your work is incomplete, please submit before the deadline so you can receive credit for the work you did complete.

      Regrade Requests

      Students will be allowed to submit regrade requests for the autograded and written portions of assignments in cases in which the rubric was incorrectly applied or the autograder scored their submission incorrectly. Regrades for the written portions of assignments will be handled through Gradescope, and autograder regrades via a Google Form. The deadline for regrade requests (autograded and written) is one week after the grades are released for the corresponding assignment.

      Always check that the autograder executes correctly! Gradescope will show you the output of the public tests, and you should see the same results as you did on DataHub. If you see a discrepancy, ensure that you have exported the assignment correctly and, if there is still an issue, post on Ed as soon as possible.

      Regrade requests will not be considered in cases in which:

      • a student uploads the incorrect file to the autograder.
      • the autograder fails to execute and the student does not notify the course staff before the assignment deadline.
      • a student fails to save their notebook before exporting and uploads an old version to the autograder.
      • a situation arises in which the course staff cannot ensure that the student’s work was done before the assignment deadline.

      Collaboration Policy and Academic Honesty

      We will be following the EECS departmental policy on Academic Honesty, which states that using work or resources that are not your own or not permitted by the course may lead to disciplinary actions, including a failing grade in the course.

      Assignments. Data science is a collaborative activity. While you may talk with others about the homework and projects, we ask that you write your solutions individually in your own words. If you do discuss the assignments with others please include their names at the top of your notebook. Restated, you and your friends are encouraged to discuss course content and approaches to problem-solving, but you are not allowed to share your code nor answers with other students, nor are you allowed to post your assignment solutions publicly. Doing so is considered academic misconduct. We will be running advanced plagiarism detection programs on all assignments. Use of AI-assisted methods, such as ChatGPT, to generate written or code solutions to assignments is prohibited.

      Exams. Cheating on exams is a serious offense. We have methods of detecting cheating on exams – so don’t do it! Students caught cheating on any exam will fail this course.

      Plagiarism on any assignment, as well as other violations to Berkeley’s Code of Conduct, will be reported to the Center for Student Conduct. The CSC treats most first-time offenses as a Non-Reportable Warning. Additionally we reserve the right to give you a negative full score (-100%) or lower on the assignments in question, an F in the course, or even dismissal from the university. It’s just not worth it!

      Rather than copying someone else’s work, ask for help. You are not alone in Data 100! The entire staff is here to help you succeed. We expect that you will work with integrity and with respect for other members of the class, just as the course staff will work with integrity and with respect for you.

      Finally, know that it’s normal to struggle. Berkeley has high standards, which is one of the reasons its degrees are valued. Everyone struggles, even though many try not to show it. Even if you don’t learn everything that’s being covered, you’ll be able to build on what you do learn, whereas if you cheat you’ll have nothing to build on. You aren’t expected to be perfect; it’s ok not to get an A.

      Academic and Wellness Resources

      Our Resources page lists not only course-specific academic resources such as course notes, past exams, study guides, and prerequisite review links, but also campus wellness resources on COVID-19, academic support, technology support, mental well-being, DSP accommodations, dispute resolution, social services, campus community, and basic needs. Our staff will also refer to this page when supporting you through this course.

      We want you to succeed!

      If you are feeling overwhelmed, visit our office hours and talk with us, or fill out the Extenuating Circumstances Form. We know college can be stressful and we want to help you succeed.

      Important Note: We are committed to being a resource to you, but it is important to note that all members of the teaching staff for this course are responsible employees, meaning that we must disclose any incidents of sexual harassment or violence to campus authorities. If you would like to speak to a confidential advocate, please consider reaching out to the Berkeley PATH to Care Center.

      Finally, the main goal of this course is that you should learn, and have a fantastic experience doing so. Please keep that goal in mind throughout the semester. Welcome to Data 100!

      Acknowledgments

      Academic Honesty policy and closing words adapted from Data 8. Course Culture inspired and adapted with permission from Dr. Sarah Chasins’ Fall 2021 CS 164 Syllabus and Grace O’Connell, the Asssociate Dean for Inclusive Excellence.

      diff --git a/_staffers/bella_crouch.md b/_staffers/bella_crouch.md deleted file mode 100644 index 203af6e..0000000 --- a/_staffers/bella_crouch.md +++ /dev/null @@ -1,10 +0,0 @@ ---- -name: Bella Crouch -role: Instructor -email: isabella.crouch@berkeley.edu -website: -photo: http://ds100.org/sp23/resources/assets/staff_pics/Bella_Crouch.jpeg -pronouns: She/Her/Hers -oh: Tue, Th 3-4pm (Warren 111) ---- - diff --git a/_staffers/dominic_liu.md b/_staffers/dominic_liu.md deleted file mode 100644 index b8bfb7e..0000000 --- a/_staffers/dominic_liu.md +++ /dev/null @@ -1,9 +0,0 @@ ---- -name: Dominic Liu -role: Instructor -email: hangxingliu@berkeley.edu -website: -photo: http://ds100.org/su23/resources/assets/staff_pics/Dominic_Liu.JPG -pronouns: He/Him/His -oh: Mon, Wed 3-4pm (Warren 111) ---- \ No newline at end of file diff --git a/_staffers/fernando_perez.md b/_staffers/fernando_perez.md new file mode 100644 index 0000000..801cbe7 --- /dev/null +++ b/_staffers/fernando_perez.md @@ -0,0 +1,9 @@ +--- +name: Fernando Pérez +role: Instructor +email: fernando.perez@berkeley.edu +website: +photo: http://ds100.org/su23/resources/assets/staff_pics/Fernando_Perez.jpeg +pronouns: He/Him/His +oh: +--- \ No newline at end of file diff --git a/_staffers/narges_norouzi.md b/_staffers/narges_norouzi.md new file mode 100644 index 0000000..f335eac --- /dev/null +++ b/_staffers/narges_norouzi.md @@ -0,0 +1,10 @@ +--- +name: Narges Norouzi +role: Instructor +email: norouzi@berkeley.edu +website: +photo: http://ds100.org/sp23/resources/assets/staff_pics/Narges_Norouzi.jpeg +pronouns: She/Her/Hers +oh: +--- + diff --git a/index.md b/index.md index 2685a86..2fa1239 100644 --- a/index.md +++ b/index.md @@ -5,21 +5,21 @@ nav_order: 1 description: A week-to-week description of the content covered in the course. course: edstem: https://edstem.org/us/courses/33744/ - faq: https://ds100.org/sp23faq + faq: https://ds100.org/fa23faq currWeekNumber: 8 --- # Data 100: Principles and Techniques of Data Science {: .mb-2 } -UC Berkeley, Summer 2023 +UC Berkeley, Fall 2023 {: .mb-0 .fs-6 .text-grey-dk-000 } -[Ed](https://edstem.org/us/courses/40266){:target="_blank" .btn .btn-ed .mr-1 } +[Ed](){:target="_blank" .btn .btn-ed .mr-1 } [Datahub](http://data100.datahub.berkeley.edu/){:target="_blank" .btn .btn-datahub .mr-1 } -[Gradescope](https://www.gradescope.com/courses/546710){:target="_blank" .btn .btn-gradescope .mr-1 } -[Extenuating Circumstances](https://forms.gle/GRREdhkik6bKm9bJA){:target="_blank .btn .btn-blue .mr-1} +[Gradescope](https://www.gradescope.com/courses/564792){:target="_blank" .btn .btn-gradescope .mr-1 } +[Extenuating Circumstances](){:target="_blank .btn .btn-blue .mr-1}
      {% assign instructors = site.staffers | where: 'role', 'Instructor' %} @@ -31,7 +31,9 @@ UC Berkeley, Summer 2023
      {: .highlight } -> Welcome to [Week 8](#week-{{page.currWeekNumber}})! +> Announcements: + +[//]: <> > Welcome to [Week 1](#week-{{page.currWeekNumber}})! diff --git a/resources/assets/staff_pics/Fernando_Perez.jpeg b/resources/assets/staff_pics/Fernando_Perez.jpeg new file mode 100644 index 0000000..8ce1a8a Binary files /dev/null and b/resources/assets/staff_pics/Fernando_Perez.jpeg differ diff --git a/resources/assets/staff_pics/Narges_Norouzi.jpg b/resources/assets/staff_pics/Narges_Norouzi.jpg new file mode 100644 index 0000000..b93e84a Binary files /dev/null and b/resources/assets/staff_pics/Narges_Norouzi.jpg differ