diff --git a/pydata-amsterdam-2020/category.json b/pydata-amsterdam-2020/category.json new file mode 100644 index 000000000..d96aac625 --- /dev/null +++ b/pydata-amsterdam-2020/category.json @@ -0,0 +1,3 @@ +{ + "title": "PyData Amsterdam 2020" +} diff --git a/pydata-amsterdam-2020/videos/alyona-galyeva-human-like-visual-search-application-with-small-data-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/alyona-galyeva-human-like-visual-search-application-with-small-data-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..e70e0a1e2 --- /dev/null +++ b/pydata-amsterdam-2020/videos/alyona-galyeva-human-like-visual-search-application-with-small-data-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\nAlyona Galyeva - Human-like Visual Search Application with Small Data | PyData Fest Amsterdam 2020\n\nDuring the workshop we cover the building blocks of Siamese Mask R-CNN model and showcase its ability to detect and segment objects from novel categories based on a single reference image. Next,we try a single deployment. Lastly, we discuss possible limitations and improvements. At the end of the workshop, participants will have a basic understanding on how to prototype and deploy human-like visual search applications.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. 
The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 5333, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Alyona Galyeva" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/2l_WASP1_1A/maxresdefault.webp", + "title": "Human-like Visual Search Application with Small Data", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=2l_WASP1_1A" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/andrew-therriault-designing-for-impact-in-civic-data-science-pydata-fest-amsterdam-2020.json 
b/pydata-amsterdam-2020/videos/andrew-therriault-designing-for-impact-in-civic-data-science-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..a2658f4ae --- /dev/null +++ b/pydata-amsterdam-2020/videos/andrew-therriault-designing-for-impact-in-civic-data-science-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\nAndrew Therriault - Designing for Impact in Civic Data Science | PyData Fest Amsterdam 2020 \n\nOpen source developers create tools that are used by millions, often in ways that their creators never imagined. Open data programs share data for the same purpose, enabling others to discover insights and build applications to help understand and improve their communities. And yet while open source and open data have both grown rapidly over the past decades, successful data science projects combining the two are surprisingly hard to find.\n\nThis presentation, from the City of Boston\u2019s former Chief Data Officer, will dig into the question of why data science projects built on open data so often fall short of their potential, and give lessons for how to design projects that succeed. Participants will learn how open data programs work, see examples of innovative projects using open data, and hear about the unique challenges facing projects that seek to promote positive social change. 
We\u2019ll also discuss how technologists can better collaborate with the public sector, to match their work to the needs of governments and nonprofits and ensure that their efforts are put into practice.\n\nAndrew Therriault is a data scientist and educator based in Boston. He previously served as the City of Boston\u2019s Chief Data Officer and the Democratic Party\u2019s Director of Data Science, and currently teaches data science at Northeastern and Harvard. Therriault also serves as a data science and strategy consultant for clients ranging from government agencies and advocacy groups to research firms and technology startups, and holds a doctorate in political science from New York University.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? 
Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 2075, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Andrew Therriault" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/1ODnn5fs6Nw/maxresdefault.webp", + "title": "Designing for Impact in Civic Data Science", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=1ODnn5fs6Nw" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/bertjan-broeksema-huib-keemink-exploring-railway-oriented-programming-in-python-pydata-fest.json b/pydata-amsterdam-2020/videos/bertjan-broeksema-huib-keemink-exploring-railway-oriented-programming-in-python-pydata-fest.json new file mode 100644 index 000000000..05ac682ca --- /dev/null +++ b/pydata-amsterdam-2020/videos/bertjan-broeksema-huib-keemink-exploring-railway-oriented-programming-in-python-pydata-fest.json @@ -0,0 +1,37 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. 
Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\nBertjan Broeksema & Huib Keemink - Exploring Railway Oriented Programming in Python | PyData Fest Amsterdam 2020\n\nAn ongoing question when developing software is: how to build reliable and correct software systems? Python applications are no exception to this question. We explore a different way of dealing with errors in your Python code. Instead of using try-except, we present the Railway Oriented Programming approach.\n\nThis approaches programming as a way of combining railway segments. In combination with type annotation, this leads to interesting possibilities for developing correct and testable applications in python. But: it also puts constraints on what should and shouldn\u2019t be done in those segments.\n\nWe have set ourselves the challenge to build the Railway pattern from scratch in Python. Follow us on this journey of implementing this pattern, and see where it leads us. Is it even useful in Python? Does it solve any problems you might have?\n\nTo follow this talk, you do not need experience with functional programming. If you know your way around python functions, you will get an introduction to a common functional pattern without the lingo!\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. 
PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 1754, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Bertjan Broeksema", + "Huib Keemink" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/cKixdve3JGg/maxresdefault.webp", + "title": "Exploring Railway Oriented Programming in Python", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=cKixdve3JGg" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/cheuk-ting-ho-open-source-in-the-eyes-of-a-minority-contributor-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/cheuk-ting-ho-open-source-in-the-eyes-of-a-minority-contributor-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..09918dbad --- /dev/null +++ b/pydata-amsterdam-2020/videos/cheuk-ting-ho-open-source-in-the-eyes-of-a-minority-contributor-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 
11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\nCheuk Ting Ho - Open-source in the eyes of a Minority Contributor | PyData Fest Amsterdam 2020\n\nIn the first part of this talk, I will talk about my personal experience in contributing to open-source. From learning how to make a Pull Request on GitHub to maintaining libraries. From attending my first meetup to co-organizing conferences. I will tell you what I observe as a self-identifying female. My opinion on certain events that happened. And what \u201chelp\u201d do we, minorities in the community, need.\n\nIn the second part of the talk, I will change to a more subjective angle to look at the diversity issues in the open-source community, especially in Python and Data Science communities. I will try to address what effort has been made and what more we can do. In the end, I will try to convince you all to be our ally and to do the right thing to make our community more inclusive and diverse.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. 
PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 1647, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Cheuk Ting Ho" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/r3W-vcsQo80/maxresdefault.webp", + "title": "Open-source in the eyes of a Minority Contributor", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=r3W-vcsQo80" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/chiel-peters-python-from-source-to-execution-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/chiel-peters-python-from-source-to-execution-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..92e4e3d7f --- /dev/null +++ b/pydata-amsterdam-2020/videos/chiel-peters-python-from-source-to-execution-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! 
Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\nChiel Peters - Python: From Source to Execution | PyData Fest Amsterdam 2020 \n\n\u201cBeautiful is better than ugly\u201d, \u201cSimple is better than complex\u201d and \u201cThere should be one\u2013 and preferably only one \u2013obvious way to do it.\u201d are a few statements from the Zen of Python. They explain the ideology behind the language: a simple, readable but yet powerful programming language. Over the years this has made it into one of the most popular languages in the world, especially within the field of AI.\n\nIn this talk, we will go into the internals of the language and see how source code is executed. Execution in (C)Python is a multi-stage process where source code is first parsed and compiled into an intermediate representation known as Python Byte Code (those .pyc files) before being fed into the interpreter. All of this happens behind the scenes every time you run a program. The presentation will explain each stage from a conceptual level and using practical examples.\n\nAt the end of the talk, the audience will have a better understanding of the internals of Python. They will be able to reason about optimizations within the language, but foremost be able to answer \u201cHow does it work?\u201d.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. 
The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 1606, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Chiel Peters" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/xfC5o8HxaBk/maxresdefault.webp", + "title": "Python: From Source to Execution", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=xfC5o8HxaBk" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/guido-van-rossum-interview-at-pydata-fest-amsterdam-2020.json 
b/pydata-amsterdam-2020/videos/guido-van-rossum-interview-at-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..81af2bc83 --- /dev/null +++ b/pydata-amsterdam-2020/videos/guido-van-rossum-interview-at-pydata-fest-amsterdam-2020.json @@ -0,0 +1,40 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchase \n\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\n\nInterviewed by Marysia Winkels & Nelson Mooren\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 
\n\n0:00 - Introduction\n1:25 - Resemblance between Python and ABC\n2:40 - Prevalence of Python in Academia/DataScience\n3:40 - Guido's new position (BDFL and steering council)\n10:15 - Questions about steering council\n16:55 - Adoption of Python 3\n20:45 - Parser update for CPython in 3.9\n27:25 - Some words about scholarship winners\n29:40 - Questions\n\nS/o to https://github.com/stobinaator for the video timestamps!\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 2073, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchase", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchase" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://github.com/stobinaator", + "url": "https://github.com/stobinaator" + } + ], + "speakers": [ + "Guido van Rossum" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi/eJUwlzR_hCY/hqdefault.jpg", + "title": "Interview", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=eJUwlzR_hCY" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/ian-ozsvald-making-pandas-fly-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/ian-ozsvald-making-pandas-fly-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..18f5c6617 --- /dev/null +++ 
b/pydata-amsterdam-2020/videos/ian-ozsvald-making-pandas-fly-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\nIan Ozsvald - Making Pandas Fly | PyData Fest Amsterdam 2020 \n\n\u201cLarger datasets can\u2019t fit into RAM - suddenly you can\u2019t use Pandas any more - but we need to analyse that data! First we\u2019ll review techniques to compress our data (maybe cutting our DataFrame RAM usage in half!) so we can process more rows using regular Pandas. Next we\u2019ll look at clever ways to make common operations run faster on DataFrames including dropping down to numpy and making better choices for the function you call. You\u2019ll leave with new techniques to make your DataFrames smaller and ideas for processing your data faster.\n\nThis talk is inspired by Ian\u2019s work updating his O\u2019Reilly book High Performance Python to the 2nd edition for 2020. With over 10 years of evolution the Pandas DataFrame library has gained a huge amount of functionality and it is used by millions of Pythonistas - but the most obvious way to solve a task isn\u2019t always the fastest or most RAM efficient. This talk will help any Pandas user (beginner or beyond) process more data faster, making them more effective at their jobs.\u201d\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. 
The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 1755, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Ian Ozsvald" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/N4pj3CS857c/maxresdefault.webp", + "title": "Making Pandas Fly", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=N4pj3CS857c" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/james-powell-furious-fast-python-7-writing-fast-python-code-pydata-fest-amsterdam-2020.json 
b/pydata-amsterdam-2020/videos/james-powell-furious-fast-python-7-writing-fast-python-code-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..741ecc141 --- /dev/null +++ b/pydata-amsterdam-2020/videos/james-powell-furious-fast-python-7-writing-fast-python-code-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\nJames Powell - Furious & Fast Python 7: Writing Fast Python Code | PyData Fest Amsterdam 2020\n\nYou\u2019ve already seen about six of these. They were kind of boring. You probably fell asleep halfway through number 5. Why is anyone still making this content? What new ground is there to cover?\n\nThis talk will cover fundamental conceptualizations and approaches to writing fast systems in Python, while critiquing how this topic has been covered in the past. It will show limitations of measurement mechanisms, conceptual limitations of the \u201cstatic view\u201d of software development, and it will show problems with non-structural micro-optimizations. It will suggest intuitions and structural approaches that lead to high performance systems in practice, as well as intuitions that can guide this development from within a more cohesive and coherent framework of understanding of the software development process.\n\nSpeaker Bio: James Powell is a professional Python programmer and enthusiast. He started working with Python in the finance industry building reporting and analysis systems for prop trading front offices. 
He currently works as a consultant building data engineering and scientific computing platforms for a wide range of clients using cutting-edge open source tools like Python and React. He also currently serves as a Board Director, Co-Chair, and Vice President at NumFOCUS, the 501(c)3 non-profit that supports all the major tools in the Python data analysis ecosystem (incl. pandas, numpy, jupyter, matplotlib, and others). At NumFOCUS, he helps build global open source communities for data scientists, data engineers, and business analysts. He helps NumFOCUS run the PyData conference series and has sat on speaker selection and organizing committees for eighteen conferences. James is also a prolific speaker: since 2013, he has given over seventy conference talks at over fifty Python events worldwide.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? 
Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 4333, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "James Powell" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/Ix04KpZiUA8/maxresdefault.webp", + "title": "Furious & Fast Python 7: Writing Fast Python Code", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=Ix04KpZiUA8" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/jim-dowling-hopsworks-ai-a-feature-store-for-machine-learning-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/jim-dowling-hopsworks-ai-a-feature-store-for-machine-learning-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..73631fbf6 --- /dev/null +++ b/pydata-amsterdam-2020/videos/jim-dowling-hopsworks-ai-a-feature-store-for-machine-learning-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. 
Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\n\n\nJim Dowling - Hopsworks.AI - A feature Store for Machine Learning | PyData Fest Amsterdam 2020 \n\nA Feature Store enables machine learning (ML) features to be registered, discovered, and used as part of ML pipelines, thus making it easier to transform and validate the training data that is fed into machine learning systems.\n\nFeature stores can also enable consistent engineering of features between training and inference, but to do so, they need a common data processing platform. The first Feature Stores, developed at hyperscale AI companies such as Uber, Airbnb, and Facebook, enabled feature engineering using domain specific languages, providing abstractions tailored to the companies\u2019 feature engineering domains. However, a general purpose Feature Store needs a general purpose feature engineering, feature selection, and feature transformation platform.\n\nIn this talk, we describe how we built a general purpose, open-source Feature Store for ML on the open-source Hopsworks platform with Apache Spark. We will show how the Feature Store enables end-to-end ML pipelines to be factored into feature engineering and data science stages that each can run at different cadences. And we will show how we built the world\u2019s first managed feature store for the cloud, hopsworks.ai.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. 
\r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 1900, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Jim Dowling" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/V8KMO3wZeUE/maxresdefault.webp", + "title": "Hopsworks.AI - A feature Store for Machine Learning", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=V8KMO3wZeUE" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/madelon-hulsebos-tomislav-suhina-joost-boonzajer-flaes-keep-the-data-flowing-pydata-fest-ams.json b/pydata-amsterdam-2020/videos/madelon-hulsebos-tomislav-suhina-joost-boonzajer-flaes-keep-the-data-flowing-pydata-fest-ams.json new file mode 100644 index 000000000..e853a86a7 --- /dev/null +++ 
b/pydata-amsterdam-2020/videos/madelon-hulsebos-tomislav-suhina-joost-boonzajer-flaes-keep-the-data-flowing-pydata-fest-ams.json @@ -0,0 +1,38 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\nMadelon Hulsebos, Tomislav Suhina & Joost Boonzajer Flaes - Keep the Data Flowing | PyData Fest Amsterdam 2020\n\nData scientists and engineers waste too much time on data issues and do not get to focus on developing and productionizing models. Potential causes range from mistyped customer IDs in Excel to incomplete and duplicate data entries. What follows is an inefficient back-and-forth process where we explore the data, summarize data issues, and send it back to the data owner through multiple iterations. This process drains time, energy, drives costs, and increases the chances of projects failing completely.\n\nAll ML pipelines make assumptions on the structure of the data being used. Once those assumptions are violated, pipelines break or models produce incorrect output. In this workshop, you will learn how to deploy Great Expectations for automating data validation, facilitating hand-offs from data owner to data scientist/engineer, and how to integrate Great Expectations into ML pipelines.\n\nThe workshop consists of an introduction to the package, live demonstration, and hands-on session. During the hands-on session, you will solve a data puzzle for which you will receive a messy data file and a set of data expectations. 
When you solve the puzzle using Great Expectations, you will be rewarded with a good functioning pipeline.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? 
Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 5645, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Madelon Hulsebos", + "Tomislav Suhina", + "Joost Boonzajer Flaes" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/aRwZ1Lfq1CI/maxresdefault.webp", + "title": "Keep the Data Flowing", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=aRwZ1Lfq1CI" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/markus-loning-introduction-to-machine-learning-with-time-series-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/markus-loning-introduction-to-machine-learning-with-time-series-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..adf8d62b8 --- /dev/null +++ b/pydata-amsterdam-2020/videos/markus-loning-introduction-to-machine-learning-with-time-series-pydata-fest-amsterdam-2020.json @@ -0,0 +1,40 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. 
Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\nMarkus Loning - Introduction to Machine Learning with Time Series | PyData Fest Amsterdam 2020 \n\nTime series are ubiquitous in real-world applications, but often add considerable complications to data science workflows. What\u2019s more, most available machine learning toolboxes (e.g. scikit-learn) are limited to the tabular setting, and cannot easily be applied to time series data.\n\nIn this tutorial, you\u2019ll learn how to apply common machine learning techniques to time series and how to extend available toolkits. This is a beginner-friendly tutorial: we assume familiarity with scikit-learn, but no prior experience with time series.\n\nTo start, you\u2019ll learn how to distinguish between different kinds of temporal data and associated learning tasks, such as forecasting and time series classification. You\u2019ll then learn how to solve these tasks with machine learning techniques specific to time series data, including:\n\nState-of-the-art algorithms for time series classification and regression, Reduction strategies, i.e. solving a complex learning task by decomposing it into simpler tasks, e.g. solving forecasting via regression, Composite strategies like ensembling and pipelining, as well as data transformations like detrending and feature extraction. We\u2019ll work through all of them step by step and make use of interactive Jupyter notebooks and sktime, a new scikit-learn compatible toolbox for machine learning with time series (https://github.com/alan-turing-institute/sktime).\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. 
The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 5234, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://github.com/alan-turing-institute/sktime", + "url": "https://github.com/alan-turing-institute/sktime" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Markus Loning" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/Wf2naBHRo8Q/maxresdefault.webp", + "title": "Introduction to Machine Learning with Time Series", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=Wf2naBHRo8Q" + } + ] +} diff --git 
a/pydata-amsterdam-2020/videos/max-gendler-supporting-business-ethics-and-governance-with-data-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/max-gendler-supporting-business-ethics-and-governance-with-data-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..b3f9d3d45 --- /dev/null +++ b/pydata-amsterdam-2020/videos/max-gendler-supporting-business-ethics-and-governance-with-data-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\nMax Gendler - Supporting Business Ethics and Governance with Data | PyData Fest Amsterdam 2020\n\nInterviewed by Vincent Warmeerdam\n\nPrivacy, data governance, and ethics have all become essential topics in a modern data-driven company. But what even are they? And how do you get started with them?\n\nWe regularly get asked what data governance is. By definition, it\u2019s a combination of three things: formalizing behaviors, holding people accountable, and supporting ethics at scale. But what does that really mean and how do you put it into practice? We like to think of it as the standardization of work, both the setting of standards and testing for them to ensure that they are applied, while simultaneously getting people to want to do the right thing. In a number of ways, governance is a giant design problem. How can we make the right thing easy?\n\nIn this talk I\u2019ll go into more detail of how we\u2019ve put this into practice at The Times, including challenges we faced along the way and key lessons learned. 
For example, how we worked together with our marketing and advertising teams to create rulebooks for safe, secure, and ethical data processing. I\u2019ll also focus specifically on how data analytics supports our mission.\n\nMy hope is that this talk will provide more clarity on an area of work that very much tends to feel fuzzy and seemingly-overwhelming, and in turn encourage other companies to consider a data governance program of their own.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? 
Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 1851, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Max Gendler" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/80k2yDRFhwI/maxresdefault.webp", + "title": "Supporting Business Ethics and Governance with Data", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=80k2yDRFhwI" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/naomi-saphra-keynote-accessible-means-hackable-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/naomi-saphra-keynote-accessible-means-hackable-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..1d7710a66 --- /dev/null +++ b/pydata-amsterdam-2020/videos/naomi-saphra-keynote-accessible-means-hackable-pydata-fest-amsterdam-2020.json @@ -0,0 +1,38 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. 
Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\nNaomi Saphra (Keynote) - Accessible Means Hackable | PyData Fest Amsterdam 2020 \n\nIn 2015, after over a decade of programming, I lost the ability to type. Confronted with a programmer\u2019s worst nightmare, I began the slow process of learning to dictate code. While customizing my environment and relying on configurations and scripts from a wider voice coding community, I simultaneously was confronted with paternalistic attitudes towards disabled people, attached to a framing of accessibility as \u201caccommodation\u201d. Often, accommodations and products for disabled people have a rigid model for their use \u2013 but the needs of blind people are just as diverse as the needs of those with sight, and disabled people are perfectly capable of improving on the use model that you offer to them. This is a story and a call for accessible systems that are open and adaptable, that allow people like me the agency to improve the tools they use.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! 
See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 2790, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Naomi Saphra" + ], + "tags": [ + "Keynote" + ], + "thumbnail_url": "https://i.ytimg.com/vi_webp/BKYWt8B9hgs/maxresdefault.webp", + "title": "Accessible Means Hackable", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=BKYWt8B9hgs" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/ondrej-kokes-high-performance-data-loss-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/ondrej-kokes-high-performance-data-loss-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..88ed21a38 --- /dev/null +++ b/pydata-amsterdam-2020/videos/ondrej-kokes-high-performance-data-loss-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. 
Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\n\nOndrej Kokes - High Performance Data Loss | PyData Fest Amsterdam 2020\n\nSay I give you a CSV with business orders, there are just three of them, the business is just taking off. Pandas tells you the average purchase is for $45, but you can equally use Excel, which gives you the same answer. In anticipation of a rosy future, you decide to use a Big Data Tool. You load it up and process the very same CSV and you report the business is actually doing thousands of orders for millions of dollars.\n\nWhat is this sorcery? Did I just hijack your analysis by \u201chacking\u201d a CSV? Are big data tools broken? Can this happen in reality?\n\nWith the emergence of big-ish data, lots of tech has focused on the performance side of things. While more performance should be better than less performance, it\u2019s not all roses. When evaluating these technologies, we\u2019ve often stumbled upon integrity issues, sometimes leading to massive data losses. Or, as illustrated above, it can lead to strange data\u2026 gains.\n\nIn this talk, I\u2019ll go over several implementation details that can lead to a large data loss without triggering any warnings or errors. We\u2019ll go over a few cases (with data and code examples), but the main ideas are as follows:\n\ncorrectness should always trump performance - always make sure you\u2019re getting the right results, only then focus on performance \u201cexplicit is better than implicit\u201d - this Zen of Python quote is not just about code clarity, it\u2019s useful when using data processing tools with hidden logic fail early, fail often - would you like a pipeline that never fails, but produces garbage, or would you prefer to be paged every now and then, because of an issue? 
The main takeaway is that you should understand the abstractions you\u2019re using to process your data, no matter what your role is. Every single step that is there between a data source and your report/analysis/database/sink should be understandable, predictable, and, most importantly, correct. After all, our job as data guardians is to deliver data things reliably and correctly - our customer doesn\u2019t care if it\u2019s in the shiniest new Apache tool or in Cobol, orchestrated by Ada.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? 
Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 1749, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Ondrej Kokes" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/hoaMzebS_l4/maxresdefault.webp", + "title": "High Performance Data Loss", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=hoaMzebS_l4" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/roelof-pieters-watching-millions-of-trees-with-python-for-impact-and-profit-pydata-fest-ams.json b/pydata-amsterdam-2020/videos/roelof-pieters-watching-millions-of-trees-with-python-for-impact-and-profit-pydata-fest-ams.json new file mode 100644 index 000000000..b2cd7c9e8 --- /dev/null +++ b/pydata-amsterdam-2020/videos/roelof-pieters-watching-millions-of-trees-with-python-for-impact-and-profit-pydata-fest-ams.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. 
Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\n\nRoelof Pieters - Watching Millions of Trees with Python: For Impact and Profit | PyData Fest AMS \n\nForests are essential to our future. More than 1.6 billion people depend on forests for food, water, fuel and medicines. They support 80% of non-human life on land and safeguard the climate by sequestering carbon. But forest fires, pests, diseases and especially deforestation lay waste to tens of millions of hectares a year. And under pressure of climate change this is only increasing.\n\nAt 20tree.ai we apply machine learning to high resolution satellite imagery, looking at trees and other vegetation all over the world constantly! In this talk I will dive into some of the work we do around monitoring both urban and rural green space. Secondly I will talk about how we bridge experimental R&D with applied ML work using nbdev, a framework made popular through the use of the second version of the popular fastai ML framework. And finally I will go over some of our continued challenges of dealing with large volumes of extremely noisy data, and reconciling this with the need to be cost-effective as a scrappy startup.\n\nRoelof Pieters is CTO and co-founder of 20tree.ai, double Computer Science dropout (once as Bsc and more recently his Phd), has double degrees in Social/Development Anthropology and has the double distinction of running two earlier failed startups, most recently creative.ai. Roelof also heads up Sunshine Lab, a sustainable design studio, and only codes in python (of course)\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. 
The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 2138, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Roelof Pieters" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/C4epqE7KcM4/maxresdefault.webp", + "title": "Watching Millions of Trees with Python: For Impact and Profit", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=C4epqE7KcM4" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/romeo-kienzler-privacy-by-design-machine-learning-pydata-fest-amsterdam-2020.json 
b/pydata-amsterdam-2020/videos/romeo-kienzler-privacy-by-design-machine-learning-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..3b6b70305 --- /dev/null +++ b/pydata-amsterdam-2020/videos/romeo-kienzler-privacy-by-design-machine-learning-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? 
Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 2639, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Romeo Kienzler" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/GuydU3AYFho/maxresdefault.webp", + "title": "Privacy by Design Machine Learning", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=GuydU3AYFho" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/sebastian-ramirez-serving-ml-easily-with-fastapi-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/sebastian-ramirez-serving-ml-easily-with-fastapi-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..45e21b236 --- /dev/null +++ b/pydata-amsterdam-2020/videos/sebastian-ramirez-serving-ml-easily-with-fastapi-pydata-fest-amsterdam-2020.json @@ -0,0 +1,40 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. 
Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\nSebastian Ramirez - Serving ML Easily With FastAPI | PyData Fest Amsterdam 2020\n\nYou know Machine Learning, your models are working well, the team likes the results\u2026 but now you need to \u201cserve\u201d them in an API so that others can interact with it (developers/frontend team/other systems).\n\nIn this talk, you will learn how to easily build a production-ready web (JSON) API for your ML models with FastAPI, including best practices by default. With very little code, you will get automatic/interactive documentation, data validation, authentication, open standards (OpenAPI, JSON Schema, OAuth2), and the best performance available in Python (on par with Go and NodeJS).\n\nOn top of that, you will have autocompletion and type checks in your editor, even for your own data, no matter the complexity of its shape.\n\nThe talk is targeted at Machine Learning practitioners that only know the basics of web development: what is an API, HTTP, JSON, etc. But can be appropriate for anyone interested in building web APIs. It\u2019s a very practical talk showing working code examples.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. 
PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. \n\n0:00 Introduction\n1:45 About FastAPI\n2:24 FastAPI Basics\n3:22 Support for type annotations\n4:17 Concise backend code\n6:00 Challenge: serving a machine learning model\n7:33 How API routes and documentation work\n11:30 Parsing HTTP body and query\n18:05 Making ML calls from the API app\n23:20 Data validation of the HTTP body\n28:52 IDE auto-completion and type checks\n30:49 Documenting fields with metadata\n32:57 Declaring mandatory fields and validating requests\n36:56 Performance\n38:27 Additional features\n39:50 About typer and thing libraries\n41:30 Q&A\n\nS/o to https://github.com/mycaule for the video timestamps!\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 2703, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://github.com/mycaule", + "url": "https://github.com/mycaule" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Sebastian Ramirez" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/IdlT8l7kHT8/maxresdefault.webp", + "title": "Serving ML Easily With FastAPI", + "videos": [ + { + "type": "youtube", + "url": 
"https://www.youtube.com/watch?v=IdlT8l7kHT8" + } + ] +} diff --git a/pydata-amsterdam-2020/videos/thijs-suijten-making-an-impact-with-duct-tape-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/thijs-suijten-making-an-impact-with-duct-tape-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..e2e16bb95 --- /dev/null +++ b/pydata-amsterdam-2020/videos/thijs-suijten-making-an-impact-with-duct-tape-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\nThijs Suijten - Making an Impact with Duct Tape | PyData Fest Amsterdam 2020\n\nAt Hack The Planet we are using our technical skills for the better. We have been working on many different challenges using various technologies like virtual reality to combat loneliness and autonomous flying drones to monitor forest fires. For our latest project we have developed a sensor that can detect mobile phones of poachers.\n\nThe system gathers data from the sensors. With analyses we can monitor and triangulate locations of suspicious activities. The data is really valuable for rangers on the ground and we are looking for ways to get more insights out of it. Think about detecting patterns and predicting poaching activity.\n\nI will share what we have so far and I\u2019d love to hear your ideas on getting the most out of this system to help rangers on the ground to protect elephants and rhinos that are facing extinction.\n\n=\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. 
PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 1550, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Thijs Suijten" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/MBgadBMANpk/maxresdefault.webp", + "title": "Making an Impact with Duct Tape", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=MBgadBMANpk" + } + ] +} diff --git 
a/pydata-amsterdam-2020/videos/tomas-sostak-popmon-population-shift-monitoring-made-easy-pydata-fest-amsterdam-2020.json b/pydata-amsterdam-2020/videos/tomas-sostak-popmon-population-shift-monitoring-made-easy-pydata-fest-amsterdam-2020.json new file mode 100644 index 000000000..0b46355d9 --- /dev/null +++ b/pydata-amsterdam-2020/videos/tomas-sostak-popmon-population-shift-monitoring-made-easy-pydata-fest-amsterdam-2020.json @@ -0,0 +1,36 @@ +{ + "description": "PyData is excited to announce PyData Global, November 11th - 15th! Tickets are now available: https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases\nPart of an underrepresented group in tech? PyData Global is offering Diversity Scholarships. Applications close September 30th: https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform\n\nTomas Sostak - Popmon: Population Shift Monitoring Made Easy | PyData Fest Amsterdam 2020\n\nTracking model performance is crucial to guarantee that a model behaves as designed initially. Predictions may be way ahead in time, so the performance can only be verified later, for example, in one year. Taking actions at that point might be already too late. Typical model performance questions are: is the model performing as expected, and are predictions made on current incoming data still valid?\n\nModel performance depends directly on the data used for training and the data to make predictions. Changes in the latter (e.g. certain word frequency, user demographics, etc.) can affect the performance and make predictions unreliable. Given that input data often change over time, it is important to track changes in both input distributions and delivered predictions periodically, and when they differ significantly - take actions. 
For example, diagnose and retrain an incorrect model in production.\n\nTo make monitoring both more consistent and semi-automatic, at ING we have developed a generic Python package called \u201cpopmon\u201d to monitor the stability of data populations over time, using techniques from statistical process control. In this talk, the speaker will present multiple scenarios of population shift, the motivation and challenges of population monitoring, as well as our open-source solution to these.\n\n\nwww.pydata.org\r\n\nPyData is an educational program of NumFOCUS, a 501(c)3 non-profit organization in the United States. PyData provides a forum for the international community of users and developers of data analysis tools to share ideas and learn from each other. The global PyData network promotes discussion of best practices, new approaches, and emerging technologies for data management, processing, analytics, and visualization. PyData communities approach data science using many languages, including (but not limited to) Python, Julia, and R. \r\n\nPyData conferences aim to be accessible and community-driven, with novice to advanced level presentations. PyData tutorials and talks bring attendees the latest project features along with cutting-edge use cases. 00:00 Welcome!\n00:10 Help us add time stamps or captions to this video! See the description for details.\n\nWant to help add timestamps to our YouTube videos to help with discoverability? 
Find out more here: https://github.com/numfocus/YouTubeVideoTimestamps", + "duration": 1939, + "language": "eng", + "recorded": "2020-06-15", + "related_urls": [ + { + "label": "Conference Website", + "url": "https://datasciencedistrict.nl/pydata-festival-amsterda/" + }, + { + "label": "https://github.com/numfocus/YouTubeVideoTimestamps", + "url": "https://github.com/numfocus/YouTubeVideoTimestamps" + }, + { + "label": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform", + "url": "https://docs.google.com/forms/d/e/1FAIpQLSfcFaTqVFjMa6kWlLPeEynEcbp1WrCxyxMGyyh4BP33eAviaA/viewform" + }, + { + "label": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases", + "url": "https://global.pydata.org/pages/tickets.html#pricing-and-ticket-purchases" + } + ], + "speakers": [ + "Tomas Sostak" + ], + "tags": [], + "thumbnail_url": "https://i.ytimg.com/vi_webp/HE-3YeVYqPY/maxresdefault.webp", + "title": "Popmon: Population Shift Monitoring Made Easy", + "videos": [ + { + "type": "youtube", + "url": "https://www.youtube.com/watch?v=HE-3YeVYqPY" + } + ] +}