{"$schema": "https://c3voc.de/schedule/schema.json", "generator": {"name": "pretalx", "version": "2026.1.1"}, "schedule": {"url": "https://pretalx.com/pyconhk2024/schedule/", "version": "0.17", "base_url": "https://pretalx.com", "conference": {"acronym": "pyconhk2024", "title": "PyCon Hong Kong 2024", "start": "2024-11-16", "end": "2024-11-17", "daysCount": 2, "timeslot_duration": "00:05", "time_zone_name": "Asia/Hong_Kong", "colors": {"primary": "#7CC0C0"}, "rooms": [{"name": "LT8", "slug": "3034-lt8", "guid": "d23185e0-ee92-5f87-aef4-b124a0b81107", "description": "Yeung Kin Man Academic Building, City University of Hong Kong", "capacity": 120}, {"name": "LT9", "slug": "3033-lt9", "guid": "58b3323d-7a4f-5b06-9a58-b2ddef8be232", "description": "Yeung Kin Man Academic Building, City University of Hong Kong", "capacity": 140}, {"name": "LT7", "slug": "3415-lt7", "guid": "4e1bc15c-5af4-5771-a26e-e49684afec2c", "description": "Yeung Kin Man Academic Building, City University of Hong Kong", "capacity": 120}], "tracks": [{"name": "DevOps", "slug": "5106-devops", "color": "#F865DB"}, {"name": "Libraries / Tools", "slug": "5108-libraries-tools", "color": "#3CA7F4"}, {"name": "Lightning \u26a1", "slug": "5104-lightning", "color": "#D09800"}, {"name": "LLM", "slug": "5102-llm", "color": "#C13DFE"}, {"name": "Performance", "slug": "5107-performance", "color": "#3BB06A"}, {"name": "Perspectives", "slug": "5105-perspectives", "color": "#FF4500"}], "days": [{"index": 1, "date": "2024-11-16", "day_start": "2024-11-16T04:00:00+08:00", "day_end": "2024-11-17T03:59:00+08:00", "rooms": {"LT9": [{"guid": "d1bc2c5f-1f99-5e48-9188-1958409e0079", "code": "BUTWTL", "id": 56372, "logo": "https://pretalx.com/media/pyconhk2024/submissions/BUTWTL/logo_with_text_rOR5xUv.gif", "date": "2024-11-16T10:00:00+08:00", "start": "10:00", "duration": "00:10", "room": "LT9", "slug": "pyconhk2024-56372-opening-remarks-by-pycon-hk", "url": "https://pretalx.com/pyconhk2024/talk/BUTWTL/", "title": "Opening Remarks by PyCon HK", "subtitle": "", "track": null, "type": "Short talk", "language": "en", "abstract": "Opening remarks and announcement", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "UZNN3F", "name": "Scotty Kwok", "avatar": "https://pretalx.com/media/avatars/UZNN3F_7kjlL0I.webp", "biography": "PyCon Hong Kong 2024 Chairman\n\nScotty Kwok is a software developer and founder of tech company. He enjoys writing software and building hardware to solve problem in his job and leisure time. He is currently working in Sebit Company Limited (www.sebit.world) as the CTO and founder, specialised in Al/computer vision. Scotty has been the speaker in several PyCons (PyCon Hong Kong 2018 & 2021 and PyCon APAC 2021) and also program committee in PyCon Hong Kong 2020,2022,2023.\n\nLinkedin:  https://www.linkedin.com/in/scottykwok/", "public_name": "Scotty Kwok", "guid": "1c8530b9-e696-54e3-9386-74fa246e223e", "url": "https://pretalx.com/pyconhk2024/speaker/UZNN3F/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/BUTWTL/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/BUTWTL/", "attachments": []}, {"guid": "ba85179a-0d08-502a-a5fe-3f54e49c8d95", "code": "QVV8XV", "id": 56575, "logo": "https://pretalx.com/media/pyconhk2024/submissions/QVV8XV/CityU_Logo_0uSHmkn.svg", "date": "2024-11-16T10:10:00+08:00", "start": "10:10", "duration": "00:10", "room": "LT9", "slug": "pyconhk2024-56575-opening-remarks-by-cityu-hk", "url": "https://pretalx.com/pyconhk2024/talk/QVV8XV/", "title": "Opening Remarks by CityU HK", "subtitle": "", "track": null, "type": "Lightning talk", "language": "en", "abstract": "Opening Speech by College of Computing CityU HK", "description": "Opening Speech by College of Computing CityU HK", "recording_license": "", "do_not_record": false, "persons": [{"code": "VLDQSC", "name": "Dr. Ray Cheung", "avatar": "https://pretalx.com/media/avatars/VLDQSC_H5qIruD.webp", "biography": "Prof CHEUNG, Ray CC\nBSc MPhil CUHK, PhD Imperial College London\n\nAssociate Provost (Digital Learning) and Professor\n\nResearch Interests:\nReconfigurable Trusted Computing; FPGA/ASIC; RISC-V / Processor Architecture; Exact / Approximate Arithmetic; System-on-Chip (SoC)", "public_name": "Dr. Ray Cheung", "guid": "7205982b-9ccf-5004-9bac-550d185532f7", "url": "https://pretalx.com/pyconhk2024/speaker/VLDQSC/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/QVV8XV/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/QVV8XV/", "attachments": []}, {"guid": "ffeab802-859c-5e59-8a18-186afc1b1993", "code": "XAFXDU", "id": 54806, "logo": null, "date": "2024-11-16T10:25:00+08:00", "start": "10:25", "duration": "00:05", "room": "LT9", "slug": "pyconhk2024-54806-keynote-pycon-hong-kong-the-story", "url": "https://pretalx.com/pyconhk2024/talk/XAFXDU/", "title": "[Keynote] PyCon Hong Kong - the Story", "subtitle": "", "track": "Perspectives", "type": "Lightning talk", "language": "en", "abstract": "[Pre-recorded Video] Passionate volunteer start the PyCon HK in Hong Kong in 2015, which turns the local python community to its next decade. In this short video, Sammy tells the story of PyCon HK and how did he involve it.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "ZXDBDT", "name": "Sammy Fung", "avatar": "https://pretalx.com/media/avatars/ZXDBDT_wrzs6Ih.webp", "biography": "Sammy is the Fellow member of Python Software Foundation, he is the founder of PyCon HK and its former conference chair. He is also President of Open Source Hong Kong and Founder of Open Platform Society.", "public_name": "Sammy Fung", "guid": "afeabc26-89f2-5eb1-aa9e-690740e6c860", "url": "https://pretalx.com/pyconhk2024/speaker/ZXDBDT/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/XAFXDU/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/XAFXDU/", "attachments": []}, {"guid": "3919a40f-3b24-563b-84a9-a5f02cf87d71", "code": "W9X8DD", "id": 52540, "logo": null, "date": "2024-11-16T10:30:00+08:00", "start": "10:30", "duration": "00:30", "room": "LT9", "slug": "pyconhk2024-52540-sponsored-keynote-large-language-models-optimization-with-python", "url": "https://pretalx.com/pyconhk2024/talk/W9X8DD/", "title": "[Sponsored Keynote] Large Language Models Optimization with Python", "subtitle": "", "track": "LLM", "type": "Talk", "language": "en", "abstract": "This talk will cover various aspects of optimizing Large Language Models (LLMs) with Python, including quick start, availability optimization, and throughput optimization. Explore cutting-edge techniques involved in areas such as model compilation, model compression, model inference batching, distributed training, and Large Model Inference (LMI) containers. Discover practical examples of optimizing some open-source models using techniques like LMI containers, Low-Rank Adaptation (LoRA), Fully Sharded Data Parallelism (FSDP), Paged Attention, Rolling Batch, and more.", "description": "The talk will delve into techniques and strategies for optimizing Large Language Models (LLMs) with Python. It focuses on addressing the computational challenges associated with training and deploying these models efficiently.\n\nOne key aspect discussed is model parallelism, which involves distributing the model across multiple devices or instances to overcome memory limitations. Tensor parallelism, a form of model parallelism, is explored, where individual tensors are split across devices. Pipeline parallelism, another technique, enables concurrent execution of different model components on separate devices.\n\nThe talk will also cover distributed training strategies, such as data parallelism and tensor-parallel language models, which leverage multiple devices to accelerate training. Techniques for reducing memory footprint, like quantization, pruning, and distillation, are explored as means to optimize LLM deployment.\n\nOptimizations for inference are also discussed, including model compression methods like quantization-aware training, pruning, and distillation. Kernel fusion, a technique that combines multiple operations into a single optimized kernel, is highlighted for improving inference performance. Additionally, the document explores accelerated inference using hardware accelerators.\n\nThe talk aims to provide guidance on leveraging Python's capabilities for efficient LLM training, deployment, and inference. It covers a range of strategies and techniques to address the computational challenges associated with these models, enabling researchers and practitioners to optimize LLMs for improved performance and cost-effectiveness.", "recording_license": "", "do_not_record": false, "persons": [{"code": "TWFLNL", "name": "Haowen Huang", "avatar": "https://pretalx.com/media/avatars/TWFLNL_ZJxnQzW.webp", "biography": "Haowen Huang is currently a Senior Developer Advocate at Amazon Web Services (AWS). He has over 20 years of experience in the telecommunications, internet, and cloud computing industries. He has previously worked for companies such as Microsoft, Sun, and China Telecom. He currently focuses on creating and sharing technical content in the areas of generative AI, large language models (LLMs), machine learning, and data science, and empowering developers around the world.", "public_name": "Haowen Huang", "guid": "5093ad3c-3f88-5638-a691-a537d516e685", "url": "https://pretalx.com/pyconhk2024/speaker/TWFLNL/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/W9X8DD/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/W9X8DD/", "attachments": []}, {"guid": "6639a1a8-bf57-51d5-b519-e36c9b16993a", "code": "RUHCB8", "id": 56461, "logo": "https://pretalx.com/media/pyconhk2024/submissions/RUHCB8/images_qcKRBEw.png", "date": "2024-11-16T11:10:00+08:00", "start": "11:10", "duration": "00:15", "room": "LT9", "slug": "pyconhk2024-56461-sign-and-verify-python-package-with-sigstore-keyless-signing", "url": "https://pretalx.com/pyconhk2024/talk/RUHCB8/", "title": "Sign and verify Python package with Sigstore keyless signing", "subtitle": "", "track": "Libraries / Tools", "type": "Short talk", "language": "zh-hant", "abstract": "Organizations are challenged in ensuring that the container image they are deploying is exactly what was produced in development and nothing has changed before it runs in production. Cryptographic signing of container images helps to verify the integrity of the image and makes sure it has not been tampered since its creation. Verification of the image signature also confirms that the expected software creator, whose identity was certified at the moment of signing, published the container image in their possession. \nIn this presentation, I will use an open source project \u201cSigstore\u201d: a cryptographic signature tool that is for improving software supply chain security. The Sigstore framework empowers software developers and consumers to securely sign and verify software artifacts. Signatures are generated with ephemeral signing keys so there\u2019s no need to manage keys. Signing events are recorded in a tamper-resistant public log so software developers can audit signing events.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "XNBL77", "name": "Frankie Ng", "avatar": "https://pretalx.com/media/avatars/XNBL77_ibGbRz1.webp", "biography": "Frankie Ng - Associate Principal Solution Architect\nFrankie Ng is an IT professional focusing on Open Source technology. Frankie has years of experience in IT infrastructure, automation, IaaS and cloud. He believes Open Source, sharing and community are the keys for technology innovation.\n\nFrankie joined Red Hat in 2016 as Solution Architect covering Hong Kong and Taiwan. He helped enterprises to drive digital transformation projects including hybrid cloud strategy, DevOps and container adoption and IT automation.", "public_name": "Frankie Ng", "guid": "f3e4939f-5de8-5fa6-b64e-dafd2462ec7b", "url": "https://pretalx.com/pyconhk2024/speaker/XNBL77/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/RUHCB8/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/RUHCB8/", "attachments": []}, {"guid": "a3353062-836f-531e-bab7-667c7abd1c84", "code": "NA7LPP", "id": 53881, "logo": null, "date": "2024-11-16T11:25:00+08:00", "start": "11:25", "duration": "00:15", "room": "LT9", "slug": "pyconhk2024-53881-network-automation-for-improved-efficiency-using-ansible-and-python", "url": "https://pretalx.com/pyconhk2024/talk/NA7LPP/", "title": "Network Automation for Improved Efficiency using Ansible and Python", "subtitle": "", "track": "DevOps", "type": "Short talk", "language": "en", "abstract": "This presentation highlights how network automation with Python and Ansible enhances management efficiency. It addresses the challenges of traditional manual network tasks, which are time-consuming, error-prone, and hard to scale. By showcasing Python's and Ansible's capabilities, the presentation demonstrates how automation leads to improved efficiency, reduced errors, and faster deployments, allowing network administrators to focus on critical tasks and ensuring a more reliable and secure network environment.", "description": "This presentation explores how network automation can significantly enhance management efficiency. Traditional manual network configuration, provisioning, and maintenance are time-consuming, error-prone, and difficult to scale with network growth.\n\nAnsible, a popular open-source tool, is introduced as a key component for automating network configurations and workflows. We explain Ansible's agentless architecture and the use of playbooks\u2014YAML files that define automated tasks for network devices.\n\nThrough code examples and a sample playbook, we demonstrate how Python scripts can interact with network devices and be integrated into Ansible playbooks, enabling the automation of complex tasks efficiently.", "recording_license": "", "do_not_record": false, "persons": [{"code": "DFNNGL", "name": "TIMOTHY LAM", "avatar": "https://pretalx.com/media/avatars/DFNNGL_JJXH9fC.webp", "biography": "I am a seasoned IT professional with over 20 years of experience, certified in PMP, CISM,, CISA and TOGAF, and recognized as an Open Group Distinguished IT Technical Specialist. \n\nAs the Strategic Business Development Director at Red Hat, I drive transformation and revenue growth through open-source solutions, enhancing customer experience and market presence.", "public_name": "TIMOTHY LAM", "guid": "db9f73b9-c337-5a3f-81d1-5fd5c260c5b6", "url": "https://pretalx.com/pyconhk2024/speaker/DFNNGL/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/NA7LPP/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/NA7LPP/", "attachments": []}, {"guid": "2e55aac0-daf5-5e17-9f92-46f789fd165f", "code": "YXQRCF", "id": 55026, "logo": null, "date": "2024-11-16T11:50:00+08:00", "start": "11:50", "duration": "00:30", "room": "LT9", "slug": "pyconhk2024-55026-build-ai-powered-rag-application-with-mysql9-0", "url": "https://pretalx.com/pyconhk2024/talk/YXQRCF/", "title": "Build AI-powered RAG application with MySQL9.0", "subtitle": "", "track": "LLM", "type": "Talk", "language": "en", "abstract": "In this session, we will show you how you can quickly build an AI-powered RAG application with MySQL9.0 and python:\n* Build your own document repository in vector store in MySQL 9.0\n* Integrate LLM in your application to process questions\n* Generate context-aware answers from your vector store", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "HCKY7M", "name": "Ryan Kuan", "avatar": "https://pretalx.com/media/avatars/HCKY7M_teDkmfM.webp", "biography": "Ryan Kuan is a Cloud Solutions Engineer who helps organisations to adopt cloud-native data architecture across the Asia Pacific regions at Oracle MySQL.  \nRyan believes that organisations adopting cloud technology can focus and innovate their business entirely without worrying about the underlying IT infrastructure the business depends upon. He has helped many organizations adopt cloud-native data science capabilities to discover invaluable information and data insights to solve complex business problems. \nPrior to joining Oracle MySQL, he worked in various roles such as Cloud Advisor, Solutions Architect, and Database Engineer at IBM, BEA Systems, and Informix respectively, he achieved various professional accreditations such as TOGAF, ITIL, and IBM certified professional architect.", "public_name": "Ryan Kuan", "guid": "294c0794-efbf-5f42-9b82-c0365aab56a0", "url": "https://pretalx.com/pyconhk2024/speaker/HCKY7M/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/YXQRCF/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/YXQRCF/", "attachments": []}, {"guid": "dc38e9d3-2663-5c2e-bec2-62f6430b70d4", "code": "THDBMS", "id": 53231, "logo": null, "date": "2024-11-16T12:25:00+08:00", "start": "12:25", "duration": "00:15", "room": "LT9", "slug": "pyconhk2024-53231-two-roads-diverged-the-gap-between-web-development-and-data-science-in-python", "url": "https://pretalx.com/pyconhk2024/talk/THDBMS/", "title": "Two roads diverged: the gap between web development and data science in Python", "subtitle": "", "track": "Perspectives", "type": "Short talk", "language": "en", "abstract": "While being a Data Scientist was once touted the sexiest job of the 21st century, how different is the life of a Python Web Developer? The author, who has served in both roles, shares her take on the difference (or lack thereof) between the two professions.", "description": "## Goal\n\nThis talk aims to illustrate the differences and similarities between the Data Scientist and the Web Developer in Python. This talk will be of interest to an audience who is contemplating which path to take, or simply curious about how Python is used in different capacities.\n\n\n## Outline\n\n- Part 1 (5 min): Mutual Myths. In this section I will discuss some common misconceptions about being a Data Scientist or Web Developer.\n- Part 2 (5 min): Transferrable Skills. In this section I will focus on the day-to-day responsibilities of the Web Developer, highlighting skills that are transferrable or learnable by the Data Scientist.\n- Part 3 (5 min): Recommendations. In this section, I will attempt to make some actionable recommendations for those contemplating to switch to the Software Engineering path in Python.", "recording_license": "", "do_not_record": false, "persons": [{"code": "LJCYKL", "name": "Chan Sau Yee", "avatar": "https://pretalx.com/media/avatars/LJCYKL_3zd11kY.webp", "biography": "Based in Tokyo, Sau Yee is a practical Python practitioner with a background in Urban Engineering. She believes coding is for everyone. She previously spoke at PyCon APAC 2023.", "public_name": "Chan Sau Yee", "guid": "ec0dd8c1-d1bf-5aa6-9911-77dab7c26547", "url": "https://pretalx.com/pyconhk2024/speaker/LJCYKL/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/THDBMS/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/THDBMS/", "attachments": []}, {"guid": "67b24fe1-2a51-5fcf-add6-69388283eb97", "code": "HN3F8L", "id": 55032, "logo": null, "date": "2024-11-16T12:40:00+08:00", "start": "12:40", "duration": "00:15", "room": "LT9", "slug": "pyconhk2024-55032-end-to-end-gpu-acceleration-for-scikit-learn-and-xgboost", "url": "https://pretalx.com/pyconhk2024/talk/HN3F8L/", "title": "End-to-end GPU Acceleration for scikit-learn and XGBoost", "subtitle": "", "track": "Performance", "type": "Short talk", "language": "en", "abstract": "With the ever-growing data size and the increasing complexity of data science workflows, high-performance computing becomes crucial for data scientists to tackle real-world problems. Attendees will learn to leverage RAPIDS projects with GPUs to accelerate and scale up scikit-learn and XGBoost model training workflows.", "description": "This talk will explore GPU acceleration beyond deep learning models and provide an overview of GPU-accelerated data science workflows. Python\u2019s rich ecosystem has made it one of the most popular programming languages today. RAPIDS offers a suite of open-source Python libraries and primitives to accelerate core data science libraries, including pandas, scikit-learn, and NetworkX, without requiring any code changes. Additionally, the latest XGBoost integrates with RAPIDS to deliver a fully accelerated model training experience. We will demonstrate how to enable a GPU-accelerated end-to-end pipeline for training scikit-learn and XGBoost models, highlighting the significant speed improvements for various scikit-learn estimators. Then, we will delve into new features that facilitate scaling XGBoost using the latest NVIDIA Grace Hopper superchip to handle large datasets. We can discuss some details about the implementation and share our experience with GPU acceleration. Finally, we will outline our roadmap for future developments.", "recording_license": "", "do_not_record": false, "persons": [{"code": "Z9NYAC", "name": "Jiaming Yuan", "avatar": "https://pretalx.com/media/avatars/Z9NYAC_mAJt2NX.webp", "biography": "Engineer, RAPIDS, NVIDIA", "public_name": "Jiaming Yuan", "guid": "11c17f4d-7365-5712-aa12-0f9f636b4325", "url": "https://pretalx.com/pyconhk2024/speaker/Z9NYAC/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/HN3F8L/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/HN3F8L/", "attachments": []}, {"guid": "625983fd-d96b-53d0-88fc-13cae2167e83", "code": "PCZC3H", "id": 57439, "logo": null, "date": "2024-11-16T14:00:00+08:00", "start": "14:00", "duration": "00:30", "room": "LT9", "slug": "pyconhk2024-57439-python-to-deploy-enterprise-grade-delta-lake-on-aws", "url": "https://pretalx.com/pyconhk2024/talk/PCZC3H/", "title": "Python to Deploy Enterprise-Grade Delta Lake on AWS", "subtitle": "", "track": "Libraries / Tools", "type": "Talk", "language": "en", "abstract": "This session explores how enterprises can build robust transactional data lakes using the open-source Delta Lake format and Python tools. The presenters will first discuss the exponential growth in enterprise data volumes and how data lakes provide a compelling solution to cost-effectively retain and extract value from vast amounts of structured and unstructured data.\nThe session outlines key limitations of traditional data lakes, such as the lack of database-like capabilities for efficient updates, maintaining performance at scale, and ensuring data consistency.\nTo address these challenges, the session will showcase how the Delta Lake format, along with complementary Python tools like PySpark and Delta-rs, can be leveraged on AWS to build highly optimized and manageable data lake architectures. The presenters will dive into two real-world use cases, covering both large-scale batch processing and smaller-scale data workloads, highlighting best practices and architectural patterns for Python developers.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "NB3CPZ", "name": "Alan, Ka Hei Ng", "avatar": "https://pretalx.com/media/avatars/NB3CPZ_aHBqWlz.webp", "biography": "Alan is an Assistant Technical Manager at ATAL Engineering Group. He is specialised in the development of total solutions for smart buildings, covering the areas of energy optimisation, air conditioning, intelligent control, and automation.", "public_name": "Alan, Ka Hei Ng", "guid": "f3344ee6-b916-538e-bbf5-ecb214042a9c", "url": "https://pretalx.com/pyconhk2024/speaker/NB3CPZ/"}, {"code": "CAGBES", "name": "Jacky Kwok", "avatar": "https://pretalx.com/media/avatars/CAGBES_BOCY7dV.webp", "biography": "Jacky Kwok is an Enterprise Solutions Architect at Amazon Web Services, Hong Kong. With more than 10 years of experience, he possesses proficiency in a wide range of technology stacks, such as Java, Python, Node.js, MySQL, and PostgreSQL. Jacky is a seasoned architect with extensive hands-on experience in application development, Data Analytic and solution architecture.", "public_name": "Jacky Kwok", "guid": "62ac09bb-743f-5a54-a405-fe826966e4d9", "url": "https://pretalx.com/pyconhk2024/speaker/CAGBES/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/PCZC3H/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/PCZC3H/", "attachments": []}, {"guid": "ebe41312-abc8-522e-b7d8-8ef8efe8583f", "code": "ES7DKX", "id": 52073, "logo": null, "date": "2024-11-16T14:40:00+08:00", "start": "14:40", "duration": "00:30", "room": "LT9", "slug": "pyconhk2024-52073-autonomous-ai-agents-for-dummies", "url": "https://pretalx.com/pyconhk2024/talk/ES7DKX/", "title": "Autonomous AI Agents for Dummies", "subtitle": "", "track": "LLM", "type": "Talk", "language": "en", "abstract": "AI Agentic workflows will drive massive AI progress this year. This is what Professor Andrew Ng said about the rise of agents. With the growing popularity of large language models, Agents are what everyone is talking about. In simple terms, Agents can be defined as LLMs with the ability to self-reason and plan, just like humans. In my talk, I will focus on how to build an Autonomous Agentic workflow and the components required. Additionally, I will cover the concepts of planning and reasoning Agentic prompting such as REACT, LATS and so on to motivate the audience to stay updated with the Agentic world.", "description": "### Problem Statment \n\nLarge Language Models (LLMs) like GPT-4 have several limitations that hinder their full potential. They often struggle with maintaining contextual understanding over extended conversations, leading to disjointed or repetitive interactions. Additionally, LLMs can lack accuracy, fail to provide real-time information, self-reasoning to decompose while planning the task. This is where Agents comes. \n\nUnlike traditional LLMs, AI agents are designed to self-reason and plan, mimicking human cognitive processes. They can interact with their environment, make decisions, and take actions autonomously. This capability enables them to overcome some of the contextual and reasoning challenges that LLMs face, making them more suitable for complex, dynamic tasks. \n\n### My talk will cover:\n- How a simple execution of task is formed by humans?\n- Agentic Workflow and the major components required: This includes: Task, Memory, Tools, Agents, LLM and so on. \n- Planning and Reasoning: Under this I will cover Chain of thoughts, REACT, LATS prompt techniques, that is used to build Agentic workflow. \n- Conclusion", "recording_license": "", "do_not_record": false, "persons": [{"code": "XVM8TR", "name": "Tarun Jain", "avatar": "https://pretalx.com/media/avatars/XVM8TR_FTeacji.webp", "biography": "Tarun Jain is a Data Scientist at [AI Planet](https://aiplanet.com), a Belgium based AI Startup. He is also a renowned speaker and recognised as [Google Developer Expert in AI/ML](https://developers.google.com/profile/u/tarunjain). Furthermore, he has contributed to various Open Source projects and is currently part of [Google Summer of Code 2024 at RedHenLab](https://summerofcode.withgoogle.com/programs/2024/projects/8D9AhF8O). He is also a content creator at [AI with Tarun](https://www.youtube.com/@aiwithtarun) Youtube channel.", "public_name": "Tarun Jain", "guid": "3b5a6fe6-c494-585f-9f13-0163d24d933e", "url": "https://pretalx.com/pyconhk2024/speaker/XVM8TR/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/ES7DKX/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/ES7DKX/", "attachments": []}, {"guid": "ee229350-c9f1-5f24-8540-53e31c91f687", "code": "B9QPQF", "id": 52959, "logo": null, "date": "2024-11-16T15:15:00+08:00", "start": "15:15", "duration": "00:15", "room": "LT9", "slug": "pyconhk2024-52959-accelerating-python-s-performance-with-c-and-cython", "url": "https://pretalx.com/pyconhk2024/talk/B9QPQF/", "title": "Accelerating Python's performance with C and Cython", "subtitle": "", "track": "Performance", "type": "Short talk", "language": "en", "abstract": "Although Python is popular and known for rapid development and great ecosystem, performance may often be an issue when running certain types of tasks. For example, we ran into performance issues when we had to parse and chunk CSV files of arbitrary sizes.\n\nUtilising C for core functions and a wrapper with Cython, we were able to quickly build a lightweight Python module that improved the performance of our use case!\n\nThrough this talk, we'd demonstrate how tools like Cython could make Python even more powerful.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "YYZQ8P", "name": "Leo Chen", "avatar": "https://pretalx.com/media/avatars/YYZQ8P_gFOoqP9.webp", "biography": "Leo Chen is a software engineer in Bloomberg's Data Technologies Infrastructure Engineering group, where he works on data ETL pipelines and workflow orchestration platforms. Over the course of his seven-year career, he has experience with multiple programming languages, machine learning frameworks, and both frontend & backend development. He is a big Python enthusiast. Leo holds a master's degree in data science from the University of Sydney.", "public_name": "Leo Chen", "guid": "e7d30b9e-d2be-5c67-93b1-da671b262472", "url": "https://pretalx.com/pyconhk2024/speaker/YYZQ8P/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/B9QPQF/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/B9QPQF/", "attachments": []}, {"guid": "85c01247-5a6e-575f-af43-f0204456b14e", "code": "TDYGRG", "id": 53944, "logo": null, "date": "2024-11-16T16:00:00+08:00", "start": "16:00", "duration": "00:30", "room": "LT9", "slug": "pyconhk2024-53944-how-to-organize-and-deploy-your-python-applications-with-docker", "url": "https://pretalx.com/pyconhk2024/talk/TDYGRG/", "title": "How to organize and deploy your Python applications with Docker", "subtitle": "", "track": "DevOps", "type": "Talk", "language": "en", "abstract": "Deploying Python applications can be difficult. In this introductory talk, I will share what I learned to help you avoid common problems.  \nWe will learn how to set up your Python projects to make them easy to deploy in Docker containers, from simple scripts to medium-sized projects made of several packages.\nWe will also look at how to use Docker Compose and understand its strengths and limits.  \nBy the end of this talk, you will know how to deploy your Python applications using Docker easily and effectively.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "T7BWHY", "name": "Cristiano Pierandrei", "avatar": "https://pretalx.com/media/avatars/T7BWHY_nq1uLK4.webp", "biography": "Cristiano Pierandrei is a seasoned Technical Lead at Aicof, specializing in IT systems for public health with over six years of experience in IT and software development.   \nHolding a Master of Science in Computer Engineering, Cybersecurity, and Artificial Intelligence from Universit\u00e0 degli Studi di Cagliari, he also teaches Machine Learning and Deep Learning at ITS Angelo Rizzoli.   \nHis expertise spans Python, Machine and Deep Learning, Data Engineering, Software Architecture, and IoT. With a background in diverse domains like customs, taxes, energy, and healthcare, Cristiano is a versatile tech leader adept at both coding and team management, making him an asset for startups seeking adaptable technical expertise.", "public_name": "Cristiano Pierandrei", "guid": "5d3eb0e9-e2a8-5321-8f35-dac4358286f5", "url": "https://pretalx.com/pyconhk2024/speaker/T7BWHY/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/TDYGRG/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/TDYGRG/", "attachments": []}, {"guid": "f425eaa0-c837-5ef4-bb18-5bd70c45aa70", "code": "ZB8QGA", "id": 54239, "logo": null, "date": "2024-11-16T16:40:00+08:00", "start": "16:40", "duration": "00:30", "room": "LT9", "slug": "pyconhk2024-54239-algorithmic-artistry-musical-ideas-for-pythonists", "url": "https://pretalx.com/pyconhk2024/talk/ZB8QGA/", "title": "Algorithmic Artistry: Musical Ideas for Pythonists", "subtitle": "", "track": "Perspectives", "type": "Talk", "language": "en", "abstract": "The almighty Python language has earned its widespread popularity. Can we build a music machine with Python that creates captivating music, with mind-blowing sounds and instruments we haven't heard before? There are numerous Python libraries for music manipulation and generation. In this talk, we will explore interactions ranging from sound synthesis to algorithmic music making, catering to both coding musicians and musical coders, all within the Python ecosystem!\n(Materials are available as a Colab Notebook: https://tinyurl.com/pycon24-music )", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "C7XA9X", "name": "Chuck-jee Chau", "avatar": "https://pretalx.com/media/avatars/C7XA9X_i0xK3mq.webp", "biography": "A stage pianist/percussionist on both acoustic and virtual instruments, as well as a computer music researcher. While he often appears in local music performances, his research works have been published in the international conference proceedings and journals. Currently teaching at CUHK Computer Science and Engineering.", "public_name": "Chuck-jee Chau", "guid": "fc64f9f8-7d6a-5cce-8cc5-68509100508d", "url": "https://pretalx.com/pyconhk2024/speaker/C7XA9X/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/ZB8QGA/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/ZB8QGA/", "attachments": []}, {"guid": "e4d96f7e-7f8e-58ed-9848-06edb0edf21b", "code": "YPKQZM", "id": 52957, "logo": null, "date": "2024-11-16T17:20:00+08:00", "start": "17:20", "duration": "00:05", "room": "LT9", "slug": "pyconhk2024-52957-data-validation-in-python", "url": "https://pretalx.com/pyconhk2024/talk/YPKQZM/", "title": "Data Validation in Python", "subtitle": "", "track": "Lightning \u26a1", "type": "Lightning talk", "language": "en", "abstract": "For data engineers to set up reliable data pipelines, it is crucial to conduct validations at each step to ensure the high quality of the data. Great Expectations (GX) is an open source framework that provides an intuitive way -- Expectations -- to define and manage data quality.\nThis lighting talk will explore how to leverage Great Expectations to automate data quality checks and increase transparency in your data pipeline. To demonstrate GX's features, we will explore two examples of Expectations (basic and conditional).", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "M7BMDX", "name": "Meixin Wang", "avatar": "https://pretalx.com/media/avatars/M7BMDX_JQZEfz2.webp", "biography": "Meixin Wang is a data engineering analyst in Bloomberg's Data department in Hong Kong. She specializes in the Python programming language and has experience developing and growing automated processes and quality controls by using technology solutions for the company's Fixed Income data products. She is passionate about staying up-to-date with the latest technologies and trends in the field and will continue developing her skills to make a positive impact. She holds a master's degree in software engineering from Fudan University.", "public_name": "Meixin Wang", "guid": "83fa32e2-a539-5180-9e58-7d6b7bf78a6e", "url": "https://pretalx.com/pyconhk2024/speaker/M7BMDX/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/YPKQZM/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/YPKQZM/", "attachments": []}, {"guid": "edb99e80-0560-5d4c-b6f7-95eae84eaac9", "code": "87VP87", "id": 52951, "logo": null, "date": "2024-11-16T17:25:00+08:00", "start": "17:25", "duration": "00:05", "room": "LT9", "slug": "pyconhk2024-52951-async-all-the-way-fastapi-and-the-asgi-era", "url": "https://pretalx.com/pyconhk2024/talk/87VP87/", "title": "Async all the way: FastAPI and the ASGI era", "subtitle": "", "track": "Lightning \u26a1", "type": "Lightning talk", "language": "en", "abstract": "In the rapidly-evolving world of Python web development, the emergence of frameworks like FastAPI has changed how software engineers build highly-performant, asynchronous applications in Python. This lightning talk will explore how the FastAPI framework makes use of the power of an Asynchronous Server Gateway Interface (ASGI) web server to enable concurrent request handling, in contrast with the traditional Web Server Gateway Interface (WSGI) approach.\n\nThrough a live demonstration, the differences between WSGI and ASGI applications will be illustrated. Synchronous applications can be blocked by long-running tasks such as I/O operations, whereas asynchronous web servers handle requests concurrently even while the thread is occupied with different tasks.\n\nBy showcasing how FastAPI's design allows for concurrent processing of multiple requests without blocking, this talk will highlight the significant performance benefits and scalability advantages provided by ASGI-powered frameworks.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "3VET9Z", "name": "Taemin Ha", "avatar": "https://pretalx.com/media/avatars/3VET9Z_rtXmB07.webp", "biography": "Tae Min Ha is a software engineer across different technology domains. He has experiences with Python application development using REST API frameworks, machine learning operations (MLOps) using cloud automations, containerized deployments, and data mining. He has spent the last four years of his career as a Market Data Engineer with Bloomberg in Hong Kong, primarily owning a variety of market data feed applications across Asian exchanges. He is well versed in programming languages like C++11/14/17 and Python. Tae Min holds a B. Eng. in computer science from the University of Hong Kong.", "public_name": "Taemin Ha", "guid": "fdb97342-42ff-516b-9f5b-118a1be02a85", "url": "https://pretalx.com/pyconhk2024/speaker/3VET9Z/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/87VP87/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/87VP87/", "attachments": []}, {"guid": "4eaceb5a-6b8f-5193-93a7-7b01b73776a6", "code": "3RF9DP", "id": 52958, "logo": null, "date": "2024-11-16T17:30:00+08:00", "start": "17:30", "duration": "00:05", "room": "LT9", "slug": "pyconhk2024-52958-creative-problem-solving-with-graphs", "url": "https://pretalx.com/pyconhk2024/talk/3RF9DP/", "title": "Creative Problem Solving with Graphs", "subtitle": "", "track": "Lightning \u26a1", "type": "Lightning talk", "language": "en", "abstract": "Graphs and networks are fundamental data structures that are rapidly growing in popularity with practicing engineers due to their use of simple elements like nodes and edges. Many real-world problems can be translated into graph problems, and we can use Python libraries, such as NetworkX, for creative problem-solving.\n\nTake a day-to-day example as simple as arranging desks in an office. Is there an optimal way to arrange people by organizational structure and/or proximity to their informal social network in order to facilitate a conducive workplace environment that also takes into account noise levels for at-desk meetings, etc.? If we were to model this in a graph data structure with nodes being people with different properties, and edges describing relationships, this will enable us to see things in different perspectives and to come up with some innovative solutions to this problem.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "LFY9EF", "name": "Xiao Ying", "avatar": "https://pretalx.com/media/avatars/LFY9EF_VBn02In.webp", "biography": "Xiao Ying is a data analyst with the Company Financials Metadata Management & Analytics team in Bloomberg's Data department. In this role, she works closely with product managers, data teams, and the company's engineers on data product developments. Prior to joining Bloomberg to work on Data teams in the firm's Singapore and Hong Kong offices, she worked at a venture capital firm focused on transformational deep tech like artificial intelligence, blockchain, and MedTech. She is passionate about exploring innovative tech solutions that add tangible value. She holds a bachelor\u2019s degree of science in statistics and management from the National University of Singapore.", "public_name": "Xiao Ying", "guid": "a957e1a5-23a7-5ff3-9762-10d3a42fb280", "url": "https://pretalx.com/pyconhk2024/speaker/LFY9EF/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/3RF9DP/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/3RF9DP/", "attachments": []}, {"guid": "b9580327-42f5-56ef-8f1e-ff21c98d8db4", "code": "ZR3XP3", "id": 48836, "logo": null, "date": "2024-11-16T17:35:00+08:00", "start": "17:35", "duration": "00:05", "room": "LT9", "slug": "pyconhk2024-48836-interactive-game-with-mediapipe", "url": "https://pretalx.com/pyconhk2024/talk/ZR3XP3/", "title": "Interactive game with Mediapipe", "subtitle": "", "track": "Lightning \u26a1", "type": "Lightning talk", "language": "zh-hant", "abstract": "\u6211\u54cb\u6642\u4e0d\u6642\u55ba\u5546\u5834\u5572\u6524\u4f4d\u898b\u5230\u5572\u4e92\u52d5\u904a\u6232-\u4eca\u6b21\u6703\u8b1b\u5413Python\u55ba\u5462\u5ea6\u9ede\u6a23\u8d77\u4f5c\u7528\nEveryone loves gaming - especially those with movements. In this we share how we made our interactive game and other \"teamlab\" ideas with Python tools such as Mediapipe.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "8HABKC", "name": "Judy Wong", "avatar": "https://pretalx.com/media/avatars/8HABKC_EFlR6r8.webp", "biography": "You would have seen Judy in PyconHK and open source activities in HK, many a times. As a host, though. This time she's gonna share share her works with us in this short talk, though. Yep.\n\nand supposed that's what she says on her IG:\nFun lover / mum of 2 / music lover / cosplayer / China interpreter / agile coach / cybersecurity analyst / robotics engineer\n\nWhat she does? More like a tech consultant that makes anything that doesn't have a ready-made solution in the market. For both hardware and software.", "public_name": "Judy Wong", "guid": "0f0f36cb-f0af-5d02-ae7c-f5c37fbb8f9b", "url": "https://pretalx.com/pyconhk2024/speaker/8HABKC/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/ZR3XP3/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/ZR3XP3/", "attachments": []}, {"guid": "4bf6942d-5e1b-54ea-a209-dfdb39106db6", "code": "UPTBUH", "id": 58841, "logo": null, "date": "2024-11-16T17:40:00+08:00", "start": "17:40", "duration": "00:05", "room": "LT9", "slug": "pyconhk2024-58841-how-many-iphones-does-it-take-to-ship-a-new-python-version", "url": "https://pretalx.com/pyconhk2024/talk/UPTBUH/", "title": "How many iPhones does it take to ship a new Python version?", "subtitle": "", "track": "Lightning \u26a1", "type": "Lightning talk", "language": "en", "abstract": "For people new to Python, it can be hard to grasp the difference between, say, Python 3.5 and Python 3.6. This lightning talk aims to conceptualise the effort it requires to ship a new Python version, by comparing that to the development of iPhone models.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "LJCYKL", "name": "Chan Sau Yee", "avatar": "https://pretalx.com/media/avatars/LJCYKL_3zd11kY.webp", "biography": "Based in Tokyo, Sau Yee is a practical Python practitioner with a background in Urban Engineering. She believes coding is for everyone. She previously spoke at PyCon APAC 2023.", "public_name": "Chan Sau Yee", "guid": "ec0dd8c1-d1bf-5aa6-9911-77dab7c26547", "url": "https://pretalx.com/pyconhk2024/speaker/LJCYKL/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/UPTBUH/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/UPTBUH/", "attachments": []}, {"guid": "3e7e39ad-5693-5d13-8a5a-ee2229b0c976", "code": "JC3QG3", "id": 58842, "logo": null, "date": "2024-11-16T17:45:00+08:00", "start": "17:45", "duration": "00:05", "room": "LT9", "slug": "pyconhk2024-58842-how-much-is-hsbc-now", "url": "https://pretalx.com/pyconhk2024/talk/JC3QG3/", "title": "\u532f\u8c50\u54a9\u50f9\u4f4d? / How much is HSBC now?", "subtitle": "", "track": "Lightning \u26a1", "type": "Lightning talk", "language": "zh-hant", "abstract": "Using Playwright, you can write a program to harvest the stock price of HSBC in 5 minutes' work.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "EKWAB9", "name": "Dr. Adrian Tam", "avatar": "https://pretalx.com/media/avatars/EKWAB9_ZyBo7za.webp", "biography": "Adrian has been using Python for work for more than 20 years. Although not the only programming language to use, it is his favorite for quick experiments and prototyping. His interest is in mathematical modeling, number crunching, high performance computing, and in the last decade, machine learning and AI.", "public_name": "Dr. Adrian Tam", "guid": "fc369b02-816a-5f37-9cae-1e9d18a278de", "url": "https://pretalx.com/pyconhk2024/speaker/EKWAB9/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/JC3QG3/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/JC3QG3/", "attachments": [{"title": "code", "url": "/media/pyconhk2024/submissions/JC3QG3/resources/Screenshot_202_rncycls.png", "type": "related"}]}, {"guid": "234738d6-7fa7-5f89-91e8-2459551da491", "code": "HTGZMQ", "id": 56373, "logo": "https://pretalx.com/media/pyconhk2024/submissions/HTGZMQ/logo_with_text_XHGMjJQ.gif", "date": "2024-11-16T17:55:00+08:00", "start": "17:55", "duration": "00:15", "room": "LT9", "slug": "pyconhk2024-56373-closing-remarks", "url": "https://pretalx.com/pyconhk2024/talk/HTGZMQ/", "title": "Closing remarks", "subtitle": "", "track": null, "type": "Short talk", "language": "en", "abstract": "Closing remarks and announcements", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "UZNN3F", "name": "Scotty Kwok", "avatar": "https://pretalx.com/media/avatars/UZNN3F_7kjlL0I.webp", "biography": "PyCon Hong Kong 2024 Chairman\n\nScotty Kwok is a software developer and founder of tech company. He enjoys writing software and building hardware to solve problem in his job and leisure time. He is currently working in Sebit Company Limited (www.sebit.world) as the CTO and founder, specialised in Al/computer vision. Scotty has been the speaker in several PyCons (PyCon Hong Kong 2018 & 2021 and PyCon APAC 2021) and also program committee in PyCon Hong Kong 2020,2022,2023.\n\nLinkedin:  https://www.linkedin.com/in/scottykwok/", "public_name": "Scotty Kwok", "guid": "1c8530b9-e696-54e3-9386-74fa246e223e", "url": "https://pretalx.com/pyconhk2024/speaker/UZNN3F/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/HTGZMQ/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/HTGZMQ/", "attachments": []}], "LT8": [{"guid": "fdab8ff2-5607-5f1e-8d17-1fb91f137920", "code": "LY8XCV", "id": 52838, "logo": "https://pretalx.com/media/pyconhk2024/submissions/LY8XCV/DALLE_2023-12-25_22.58.49_-_A_cute_cartoon-style_llama_in_24XhaeG.png", "date": "2024-11-16T11:10:00+08:00", "start": "11:10", "duration": "00:30", "room": "LT8", "slug": "pyconhk2024-52838-taiwan-llm-bridging-the-linguistic-divide-with-a-culturally-aligned-language-model", "url": "https://pretalx.com/pyconhk2024/talk/LY8XCV/", "title": "Taiwan LLM: Bridging the Linguistic Divide with a Culturally Aligned Language Model", "subtitle": "", "track": "LLM", "type": "Talk", "language": "en", "abstract": "[ONLINE presentation] This talk introduces TAIWAN-LLM, a pioneering Large Language Model specifically designed for Traditional Chinese as used in Taiwan. We'll discuss how TAIWAN-LLM addresses the underrepresentation of Traditional Chinese in existing language models, bridging the linguistic and cultural divide. The presentation will cover our approach to developing a culturally aligned model, including the use of a comprehensive Taiwanese corpus, instruction fine-tuning, and real user feedback incorporation. We'll share evaluation results demonstrating TAIWAN-LLM's superior performance in understanding and generating Traditional Chinese text compared to existing models.", "description": "This will be an online presentation.\nIn this presentation, we'll dive deep into the development and capabilities of TAIWAN-LLM, the first Large Language Model tailored for Traditional Chinese speakers in Taiwan. Key topics include:\n\n1. The challenge of linguistic underrepresentation in existing LLMs\n2. Our three-phase methodology: Continue-Pretraining, Supervised Fine-Tuning, and Feedback Supervised Fine-Tuning\n3. The composition and curation of our Taiwanese corpus\n4. Evaluation results on various NLP tasks, including contextual QA, summarization, and classification\n5. Real-world applications and use cases of TAIWAN-LLM\n6. The importance of culturally aligned language models for preserving linguistic diversity\n\nWe'll also discuss the open-source release of TAIWAN-LLM and its potential impact on NLP research and applications for Traditional Chinese.", "recording_license": "", "do_not_record": false, "persons": [{"code": "HKASZZ", "name": "Yenting Lin", "avatar": "https://pretalx.com/media/avatars/HKASZZ_r5lBZjO.webp", "biography": "Yen-Ting Lin is a Ph.D. candidate at National Taiwan University, advised by Professor Yun-Nung (Vivian) Chen. His research focuses on large language models (LLMs), and he is currently leading the Taiwan-LLM project, which develops language models optimized for Traditional Chinese, addressing the unique linguistic needs of Taiwan. \n\nHe has gained practical experience through internships at companies such as Meta GenAI in summer 2024, NVIDIA Research in spring 2024, Amazon Alexa AI in the summers of 2021, 2022, and 2023, MediaTek Research in the summer of 2019, and IBM Research in the summer of 2020.\n\nYen-Ting is actively seeking industry research scientist or engineer positions starting in 2025.", "public_name": "Yenting Lin", "guid": "ffacdc6c-b632-525d-a61b-6a97b34a5491", "url": "https://pretalx.com/pyconhk2024/speaker/HKASZZ/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/LY8XCV/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/LY8XCV/", "attachments": []}, {"guid": "bbbfa7ab-32c9-5cba-82a1-3256c01f7c50", "code": "K7VYAH", "id": 53872, "logo": "https://pretalx.com/media/pyconhk2024/submissions/K7VYAH/DSL-logo_EYz3d5p.png", "date": "2024-11-16T11:50:00+08:00", "start": "11:50", "duration": "00:30", "room": "LT8", "slug": "pyconhk2024-53872-hackman-iot-membership-platform-on-raspberry-pi-nix-for-hong-kong-s-first-hackerspace", "url": "https://pretalx.com/pyconhk2024/talk/K7VYAH/", "title": "Hackman: IoT & membership platform on Raspberry Pi & Nix for Hong Kong's first Hackerspace", "subtitle": "", "track": "DevOps", "type": "Talk", "language": "en", "abstract": "We build everything ourselves at Dim Sum Labs, Hong Kong's first Hackerspace. This includes Hackman, the IoT system that manages our membership and controls the space's door, lights, appliances, and electricity usage. Hackman is written in Python and runs entirely on a Raspberry Pi 5. We will bring a replica of Hackman and some attachments (we can't bring the door, though) and give a live demo. You will hear about how we use Nix, DevOps/GitOps, a staging Raspberry Pi, and software engineering practices that make it reliable. We will show how it can be easily extended using Redis.", "description": "Hackman is a Hackerspace management system for Dim Sum Labs, Hong Kong's first Hackerspace. It is a Django application running on a Raspberry Pi 5 that manages our membership, controls access to the space, and much more. It serves a critical function for our space hence it must be reliable. Our members should easily add features to it while keeping the core stable.\n\nIn this talk, we will talk about how we use various software engineering practices to make it stable and reliable while making it extensible. We'll discuss:\n\n* How the Django application is structured\n* How we use Redis as a means to easily extend the system\n* How we use Nix to make the operating system and the application easily reproducible\n* How we use DevOps/GitOps along with ample tests to manage software deployments\n\nDim Sum Labs is Hong Kong\u2019s first and longest-running Hackerspace since 2011, open to anyone interested in hacking: the intellectual challenge to creatively overcome or otherwise \u201chack\u201d the limitations, capabilities, purposes, forms, etc. of virtually anything \u2014 or in other words: to mess around and build anything for fun. The members extend this ethos to its membership management system and the IoT in the space. For more information, visit us at https://www.dimsumlabs.com/ . Hackman is open source and can be accessed at https://github.com/dimsumlabs/hackman", "recording_license": "", "do_not_record": false, "persons": [{"code": "S99Z8Y", "name": "Nigel Choi", "avatar": "https://pretalx.com/media/avatars/S99Z8Y_H2MWgiW.webp", "biography": "A lifelong dabbler, learner, and maker, Nigel is an active member of Dim Sum Labs, Hong Kong's longest running Hackerspace. Professionally, he is currently Head of Engineering at Eythos, a tech-enabled fine arts service company in Hong Kong. His varied background includes inventing and selling Chokerkeys (a macro keypad), being a consultant at McKinsey & Company, and Silicon Valley engineer at Google, Yahoo. He holds a Masters in Computer Science from Stanford University.", "public_name": "Nigel Choi", "guid": "22e40c68-a0b2-5545-bec2-292970c6f779", "url": "https://pretalx.com/pyconhk2024/speaker/S99Z8Y/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/K7VYAH/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/K7VYAH/", "attachments": []}, {"guid": "c5556075-9cad-59db-a013-c6b48bc9610c", "code": "HZAX7P", "id": 53753, "logo": "https://pretalx.com/media/pyconhk2024/submissions/HZAX7P/0262039C-19CF-42A1-AA52-178E652AD20B_1_105_c_InLTyrF.jpeg", "date": "2024-11-16T12:25:00+08:00", "start": "12:25", "duration": "00:30", "room": "LT8", "slug": "pyconhk2024-53753-hk-python-user-group", "url": "https://pretalx.com/pyconhk2024/talk/HZAX7P/", "title": "\u5982\u679cHK Python User Group\u5514\u58ef\u5927\uff0c\u9326\u9bc9\u5c31\u5927\u944a\u4e86!", "subtitle": "", "track": "Perspectives", "type": "Talk", "language": "zh-hant", "abstract": "\u4f5c\u70ba\u4e00\u500b\u591a\u5e74\u7d44\u7e54 OSC /PYCON\u7684\u4e2d\u5e74\u5927\u53d4\uff0c\u60f3\u5206\u4eab\u4e00\u4e0b\u5982\u4f55\u7d93\u71df\u672c\u5730\u793e\u5340\uff0c\u518d\u5206\u4eab\u5916\u5730\u7684\u7d93\u9a57\uff0c\u5e0c\u671b\u66f4\u591a\u4eba\u53ef\u4ee5\u53c3\u8207\u5230\uff0c\u8b93\u6211\u80fd\u6709\u6a5f\u6703\u8b8a\u56de\u4e00\u500b\u53c3\u52a0\u8005\u8eab\u4efd\u3002", "description": "\u6211\u6703\u5206\u4eab \u904e\u5f80\u8d85\u904e\u5341\u5e74 PYCON HK/ OSHK \u7684\u7d93\u9a57\uff0c\u52a0\u5de6\u8fd1\u5e74\u53c3\u52a0\u5916\u5730PYCON APAC\u4e4b\u9593\u7684\u6d3b\u52d5\uff0c\u53bb\u4e86\u89e3\u672c\u5730\u793e\u7fa4\u7684\u4e0d\u8db3\uff0c\u6709\u66f4\u591a\u4e8b\u60c5\u53ef\u4ee5\u6539\u5584\uff0c\u8b93Python User Group \u80fd\u5920\u6709\u6a5f\u5730\u6210\u9577\u3002\u5305\u62ec \u5ba3\u50b3\uff0c\u8a2d\u8a08\uff0c\u8a08\u5283\uff0c\u64cd\u4f5c\u5404\u7bc4\u7587\u3002", "recording_license": "", "do_not_record": false, "persons": [{"code": "NFGFHQ", "name": "Calvin Tsang", "avatar": "https://pretalx.com/media/avatars/NFGFHQ_PtkCOPj.webp", "biography": "Vice President of PyCon HK 2024\nFormer OC in PyCon APAC \nVice President of Open Source Hong Kong", "public_name": "Calvin Tsang", "guid": "c0b94c9b-c979-56e2-b9a8-3d81256fd42a", "url": "https://pretalx.com/pyconhk2024/speaker/NFGFHQ/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/HZAX7P/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/HZAX7P/", "attachments": []}, {"guid": "fac9191e-d58f-5428-bd64-4ef6cf7fd23a", "code": "UGFV3S", "id": 55027, "logo": null, "date": "2024-11-16T14:00:00+08:00", "start": "14:00", "duration": "00:30", "room": "LT8", "slug": "pyconhk2024-55027-numbast-bridging-the-gap-between-cuda-c-and-python", "url": "https://pretalx.com/pyconhk2024/talk/UGFV3S/", "title": "Numbast: Bridging the gap between CUDA C++ and Python", "subtitle": "", "track": "Performance", "type": "Talk", "language": "en", "abstract": "- Numba is a popular JIT compiler that translates Python code into optimized machine code for various hardware targets, and Numba-CUDA supports compilation of Python code for execution on NVIDIA devices. Whilst Numba-CUDA provides many basic accelerated programming function blocks out of the box, manually creating bindings for a CUDA device library is still laborious. \n- Numbast is an auto device binding generation tool created by NVIDIA. Numbast provides an end-to-end binding generation mechanism that quickly bridges the gap between the CUDA ecosystem and Python CUDA.\n- In this talk, attendees will learn about recent progress of accelerated computing in Python with Numba-CUDA, the internal mechanisms of Numbast, and get hands-on experience of crafting CUDA kernels in Numba-CUDA, as well as creating bindings with Numbast.\n- Additionally, we will provide an insight into how Numba is used across RAPIDS, Nvidia\u2019s accelerated computing solution that focuses on making accelerated computing more accessible to the general python community. Time permitting, we will also introduce how user-defined functions (UDF) are used in `cudf.pandas`.", "description": "See Abstract.", "recording_license": "", "do_not_record": false, "persons": [{"code": "LVFYRN", "name": "Michael Wang", "avatar": "https://pretalx.com/media/avatars/LVFYRN_kcNoZjT.webp", "biography": "Michael Yh Wang is a software engineer in Nvidia Rapids. He currently contributes his engineering skills towards cuDF, cuSpatial and Numba. Prior to Nvidia he acquired a master of science degree from Yale University. His earlier experience includes working as a visual effect supervisor at an independent film project, and achieving first place at the WAIC 2020 hackathon competition. Michael has strong interests in software engineering, computer graphics algorithms and compiler technology. He believes in a future where accelerated computing can be brought more accessible to the public via compiler and language innovations.", "public_name": "Michael Wang", "guid": "69a4eec2-7dab-50ea-9449-1ea398a31568", "url": "https://pretalx.com/pyconhk2024/speaker/LVFYRN/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/UGFV3S/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/UGFV3S/", "attachments": [{"title": "Presentation Slides", "url": "/media/pyconhk2024/submissions/UGFV3S/resources/Numbast_102824_AGSL12z.pdf", "type": "related"}]}, {"guid": "404a8b59-8993-56f5-8fec-03e651b7a880", "code": "9HHTWK", "id": 52489, "logo": null, "date": "2024-11-16T14:40:00+08:00", "start": "14:40", "duration": "00:30", "room": "LT8", "slug": "pyconhk2024-52489-operate-with-confidence-opentelemetry-in-python", "url": "https://pretalx.com/pyconhk2024/talk/9HHTWK/", "title": "Operate with Confidence -- OpenTelemetry in Python", "subtitle": "", "track": "Libraries / Tools", "type": "Talk", "language": "en", "abstract": "In this era of microservices, the '3 Pillars of  System Observability', a.k.a. **logging**, **metrics monitoring** and **traffic tracing** are pivotal in giving developers quick feedbacks on the **performance** and **behaviour** of their application. With good observability practices, not only developers can understand the bottleneck and stability of their app, they can even be benefited from faster iteration cycle due to reliable feedback loops.\n\nIn this talk, the usage of **OpenTelemetry** package, a well-known open-source Observability stack, in Python will be addressed. OpenTelemetry is a **vendor-** and **tool-agnostic**, Observability stack integrating with a broad variety of Observability backends, including open source tools like **Jaeger** and **Prometheus**, as well as commercial offerings. \n\nWith the introduction of usage of OpenTelemetry in Python, it is hoped that users have more **understanding on the '3 Pillars of System Observability'**, **actively and confidently monitor** their Python workloads, and define a **suitable and meaningful Service Level Objective (SLO)** for their program.", "description": "This talk will be broken down into following sessions:\n- Introduction: 3 Pillars of System Observability (~5 mins)\n- OpenTelemetry on Python FastAPI and AWS Lambda, with Visualizations (~15 - 20 mins)\n- Why not just Logging? (~2 mins)\n- Why not just Metrics (with Prometheus)? (~2 mins)\n- Integration with other Cloud Monitoring Platforms (~2-3 mins)", "recording_license": "", "do_not_record": false, "persons": [{"code": "3TV7ZX", "name": "Alex Au", "avatar": "https://pretalx.com/media/avatars/3TV7ZX_YYOW8lE.webp", "biography": "I am a Cloud Engineer with past experiences of production-grade ML and backend developments. In my 4 years of experience in Python, I have been working on AI / recommender system and cloud computing. I like to explore topics in AI, information retrieval and system designs in my leisure time. I also contributes to some Rust and Python Open-Source projects. In the era of Cloud and AI / ML Technologies, I would like to share efficient and cost-effective system designs to others for advancing their developments or businesses.", "public_name": "Alex Au", "guid": "1335f69e-634f-5055-994e-ec443b3d55be", "url": "https://pretalx.com/pyconhk2024/speaker/3TV7ZX/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/9HHTWK/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/9HHTWK/", "attachments": []}, {"guid": "51163268-787e-5340-81d2-6a1ab9077761", "code": "GYCVTG", "id": 53649, "logo": null, "date": "2024-11-16T15:15:00+08:00", "start": "15:15", "duration": "00:15", "room": "LT8", "slug": "pyconhk2024-53649-leveraging-multi-models-and-open-webui-to-mimic-chatgpt-with-data-security-considerations", "url": "https://pretalx.com/pyconhk2024/talk/GYCVTG/", "title": "Leveraging Multi-Models and Open WebUI to Mimic ChatGPT with Data Security Considerations", "subtitle": "", "track": "LLM", "type": "Short talk", "language": "en", "abstract": "In an era where data security and control are paramount, leveraging local and in-house AI solutions has become increasingly significant. This presentation will explore how to use Open WebUI to build on-device GPT models or in-house server-based GPT systems, offering robust alternatives to cloud-based AI solutions like Copilot, ChatGPT-4o. The focus will be on ensuring data remains local or within company control, addressing key security considerations.", "description": "The talk will cover the following aspects:\n##### 1. Introduction to Open WebUI:\n   \u25e6 Overview of Open WebUI, an extensible and feature-rich self-hosted WebUI designed to operate offline.\n   \u25e6 Discussion on its capabilities to integrate various LLM runners, including Ollama and OpenAI-compatible APIs.\n##### 2. Setting Up Open WebUI:\n   \u25e6 Step-by-step guide on installing and configuring Open WebUI using Docker or Kubernetes for seamless deployment.\n   \u25e6 Instructions on integrating GPU support for enhanced performance.\n##### 3. Multi-Model Integration:\n   \u25e6 Demonstration of how to leverage multiple models within Open WebUI, allowing for versatile and powerful interactions.\n   \u25e6 Examples of using models such as LLaVA, Llama3, Phi-3 Mini, and more for diverse applications.\n##### 4. Enhancing Functionality with Plugins:\n   \u25e6 Introduction to the Pipelines Plugin Framework to incorporate custom logic and Python libraries.\n   \u25e6 Examples of plugins for web search, document search, Discord integration, and more.\n##### 5. Data Security and Control:\n   \u25e6 Discussion on the importance of keeping data local or within company infrastructure.\n   \u25e6 Best practices for ensuring data security and compliance while using in-house AI solutions.\n##### 6. Building a Powerful Interface:\n   \u25e6 Tips on extending Open WebUI to create a user interface similar to ChatGPT-4o.\n   \u25e6 Leveraging features such as Markdown and LaTeX support, hands-free voice/video call, and retrieval-augmented generation (RAG) for a dynamic user experience.", "recording_license": "", "do_not_record": false, "persons": [{"code": "DQE737", "name": "Dr. Chung Ng", "avatar": "https://pretalx.com/media/avatars/DQE737_kWCqEpL.webp", "biography": "Dr. Chung is a SVP at Group CTO Office of the HKT/PCCW Group, where he\u2019s responsible for leading the group\u2019s product and technology roadmap and strategic development. He also represents the group as board members of Lynx Analytics and Bindo Labs.\n\nBefore HKT/PCCW, Chung contributed to the Big Data/AI strategy at Telstra as well as its international growth strategy. Prior to Telstra, Chung was an Associate Partner of Cluster Technology Limited which serves the Greater China market with professional services and solutions in high-performance computing, machine learning, big data, and public cloud.\n\nIn 2008, Chung joined McKinsey & Company in the Hong Kong office. He received his DPhil in Information Engineering from the University of Oxford and held the Croucher Foundation Scholarship to work toward his research degree in wireless ad-hoc networks. Chung also received BEng and MPhil in Information Engineering from the Chinese University of Hong Kong.", "public_name": "Dr. Chung Ng", "guid": "89b72ce6-10f6-52b5-a4fc-b39f1d13f566", "url": "https://pretalx.com/pyconhk2024/speaker/DQE737/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/GYCVTG/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/GYCVTG/", "attachments": []}, {"guid": "e140daa0-98ef-56cc-a62d-7302b1db500e", "code": "UVKEGD", "id": 52631, "logo": null, "date": "2024-11-16T16:00:00+08:00", "start": "16:00", "duration": "00:30", "room": "LT8", "slug": "pyconhk2024-52631-time-to-skip-tedious-steps-spare-efforts-with-pytorch-lightning", "url": "https://pretalx.com/pyconhk2024/talk/UVKEGD/", "title": "Time to Skip Tedious Steps - Spare Efforts with PyTorch Lightning", "subtitle": "", "track": "Libraries / Tools", "type": "Talk", "language": "en", "abstract": "With the rapid advancement in deep learning, models become super large and consume significant resources, making efficiency and simplicity more critical than ever. In this talk, we introduce PyTorch Lightning, a deep learning framework that emerges as a powerful tool that streamlines the process of building, training, and scaling models, allowing researchers and practitioners to focus on what truly matters: innovation.\n\nWe will begin with an overview of PyTorch Lightning, discussing the key benefits it offers over traditional PyTorch. We will explore how PyTorch Lightning abstracts away the boilerplate code associated with model training, making it easier to implement and experiment with complex models. Then, we walk through the process of training a ResNet in PyTorch Lightning for image classification task and explore some advanced features in PyTorch Lightning.\n\nFor those interested in revisiting the content from the talk, feel free to check out the links below:\n- GitHub Code Demo: [github/wyhwong/PyConHK2024-PyTorch-Lightning](https://github.com/wyhwong/PyConHK2024-PyTorch-Lightning)\n- Slides: [OneDrive](https://1drv.ms/p/c/7adfdf652c41fb6c/EZ-Bd0i38FJKmzw5_ZYT6UIBDWWKBVsM30SlBTa2R2Cx1A)", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "7DKPAY", "name": "Henry, Wai Yin Wong", "avatar": "https://pretalx.com/media/avatars/7DKPAY_KCTdHeE.webp", "biography": "Henry is a data scientist with 4 years of experience in Python. With broad exposure to classical and modern statistical approaches, he has been developing solutions for HVAC energy optimization, object detection and classification, predictive maintenance, physics-guided machine learning, and survival analysis. Henry has also contributed to academic research in the field of black-hole physics under the Bayesian framework.", "public_name": "Henry, Wai Yin Wong", "guid": "455b6e3c-35e8-5561-9dc3-25b43a9e2457", "url": "https://pretalx.com/pyconhk2024/speaker/7DKPAY/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/UVKEGD/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/UVKEGD/", "attachments": []}, {"guid": "1fa8f64d-1d5e-5606-aced-0e91da8d707f", "code": "WQJV7B", "id": 50952, "logo": null, "date": "2024-11-16T16:40:00+08:00", "start": "16:40", "duration": "00:30", "room": "LT8", "slug": "pyconhk2024-50952-simplifying-python-web-app-operations-automating-k8s-ops-with-open-source", "url": "https://pretalx.com/pyconhk2024/talk/WQJV7B/", "title": "Simplifying Python Web App Operations: Automating K8s Ops with Open Source", "subtitle": "", "track": "DevOps", "type": "Talk", "language": "en", "abstract": "After creating a great web app using Python such as with flask, the next hurdle to production is how to make it available to users and operate it. And not just your app, but also ingress, the database, observability and the list goes on. We will go through your options for simplifying the operations of your web app using open source tooling. This will include using k8s directly, helm charts, IaaC using pulumi and new tooling developed by Canonical using juju. By the end of the talk you will have seen the benefits and drawbacks of each which will help you make an informed decision on which tool best suits your needs!", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "NTSWYJ", "name": "YangSoo Yoon", "avatar": "https://pretalx.com/media/avatars/NTSWYJ_UPyQpsW.webp", "biography": "I am a platform developer at Canonical, working on a platform called Juju, a bootstrapped controller for both VMs and Kubernetes. I have always been an avid Python developer since his days in an AI startup to platform development.\nPlease don't hesitate to reach out to me if you have any questions!", "public_name": "YangSoo Yoon", "guid": "e247b4d3-124b-5056-a25f-980ce2200354", "url": "https://pretalx.com/pyconhk2024/speaker/NTSWYJ/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/WQJV7B/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/WQJV7B/", "attachments": []}], "LT7": [{"guid": "03965158-0ff1-51ae-8397-bb45da8ca4d5", "code": "FJLLGF", "id": 52539, "logo": null, "date": "2024-11-16T11:10:00+08:00", "start": "11:10", "duration": "00:30", "room": "LT7", "slug": "pyconhk2024-52539-pydantic-logfire-empowering-python-observability", "url": "https://pretalx.com/pyconhk2024/talk/FJLLGF/", "title": "Pydantic Logfire: Empowering Python Observability", "subtitle": "", "track": "Libraries / Tools", "type": "Talk", "language": "en", "abstract": "Pydantic Logfire is an advanced observability platform tailored for Python applications, integrating seamlessly with the popular Pydantic library. Built on the principles of simplicity and power, Pydantic Logfire offers deep insights into application behavior through Python-centric telemetry, structured logging, and powerful SQL querying capabilities. Leveraging OpenTelemetry for comprehensive instrumentation, it ensures Python developers can efficiently monitor, debug, and optimize their codebases. From small scripts to enterprise deployments, Pydantic Logfire transforms raw data into actionable insights, simplifying the observability journey for Python developers.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "XHT9ZV", "name": "Hemangi Karchalkar", "avatar": "https://pretalx.com/media/avatars/XHT9ZV_jFYFMbW.webp", "biography": "I\u2019m Hemangi Karchalkar, a senior software developer at Epam Systems, weaving Python magic for five years. By day, I\u2019m your go-to coding junkie, and by night, I moonlight as a Python mentor, adding a sprinkle of jokes to the learning mix. Multitasking is my superpower, and I firmly believe that laughter is the best debugger. In the world of brackets and semicolons, I bring a dose of humor, making coding an entertaining adventure. Join me for a Python journey where code and comedy collide, bugs are no match for wit, and mentorship comes with a side of humor.", "public_name": "Hemangi Karchalkar", "guid": "b4bb3b14-c8f1-53d1-a6cb-d5f2cd1b2635", "url": "https://pretalx.com/pyconhk2024/speaker/XHT9ZV/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/FJLLGF/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/FJLLGF/", "attachments": []}, {"guid": "83ef97e5-211e-515a-bb9e-674bb8f9523f", "code": "LNUWEC", "id": 53730, "logo": null, "date": "2024-11-16T11:50:00+08:00", "start": "11:50", "duration": "00:30", "room": "LT7", "slug": "pyconhk2024-53730-high-throughput-python", "url": "https://pretalx.com/pyconhk2024/talk/LNUWEC/", "title": "High Throughput Python", "subtitle": "", "track": "Performance", "type": "Talk", "language": "en", "abstract": "Python is infamous for its slowless and the GIL problem. In Python 3.4, asyncio was introduced to allow non-blocking I/O, and concurrent.futures was introduced for an easier syntax to write parallel code. But still, Python is not super fast. In this talk, I will show case 10+ ways of generating data in parallel in Python and compare their performance. The unfortunate conclusion is that nothing is always the best, even with the free-threaded Python of 3.13, the silver bullet does not exist.", "description": "The talk is focus on CPython and experiment is done on Apple Silicon. It is to generate numpy array of random float as an example, and later to extend into Python lists of floats. I will compare the data generation throughput amongst using multiprocessing, threading, and concurrency.futures modules in Python as well as numba and joblib external libraries. The key result is to highlight the trade off between threading vs multiprocessing, in which if you want to use multiprocessing to work around the GIL, you pay the price of inter-process communication overhead. Even with free-threaded Python in 3.13 that you can avoid the GIL, you can't find a solution that is always better.", "recording_license": "", "do_not_record": false, "persons": [{"code": "EKWAB9", "name": "Dr. Adrian Tam", "avatar": "https://pretalx.com/media/avatars/EKWAB9_ZyBo7za.webp", "biography": "Adrian has been using Python for work for more than 20 years. Although not the only programming language to use, it is his favorite for quick experiments and prototyping. His interest is in mathematical modeling, number crunching, high performance computing, and in the last decade, machine learning and AI.", "public_name": "Dr. Adrian Tam", "guid": "fc369b02-816a-5f37-9cae-1e9d18a278de", "url": "https://pretalx.com/pyconhk2024/speaker/EKWAB9/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/LNUWEC/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/LNUWEC/", "attachments": [{"title": "Presentation slides", "url": "/media/pyconhk2024/submissions/LNUWEC/resources/Parallel_0wXka3V.pdf", "type": "related"}]}, {"guid": "6bff9c3c-69cc-518f-9a9b-f3427c1abf28", "code": "CEWPVB", "id": 49762, "logo": null, "date": "2024-11-16T12:25:00+08:00", "start": "12:25", "duration": "00:30", "room": "LT7", "slug": "pyconhk2024-49762-local-llm", "url": "https://pretalx.com/pyconhk2024/talk/CEWPVB/", "title": "Local \u77e5\u8b58\u64c2\u53f0LLM\u5927\u683c\u9b25", "subtitle": "", "track": "LLM", "type": "Talk", "language": "zh-hant", "abstract": "[ONLINE presentation] In the LLM world, every one is using GPT-4 as the golden standard. Are there cases where smaller language model can outperform GPT4 in terms of its richness in language expression and wealth of local knowledge? We want to present our discovery work on evaluating a suite of LLMs in the area of Cantonese skills, Hong Kong local geography and social knowledge. \n\nWe will demo our open-sourced platform for others to play with the Cantonese, Hong Kong-specific chatbot arena as well. \u4e00\u9f4a\u9ece\u6311\u6a5f\u5566\uff01", "description": "This will be an online presentation.\nIn the LLM world, every one is using GPT-4 as the golden standard. Are there cases where smaller language model can outperform GPT4 in terms of its richness in language expression and wealth of local knowledge? We want to present our discovery work on evaluating a suite of LLMs in the area of Cantonese skills, Hong Kong local geography and social knowledge. \n\nWe will demo our open-sourced platform for others to play with the Cantonese, Hong Kong-specific chatbot arena as well. \u4e00\u9f4a\u9ece\u6311\u6a5f\u5566\uff01", "recording_license": "", "do_not_record": false, "persons": [{"code": "UXMVWE", "name": "Winnie Yeung", "avatar": "https://pretalx.com/media/avatars/UXMVWE_pdAi83r.webp", "biography": "Senior ML Engineer at Square (San Francisco Bay Area), previously at Visa and Fidelity. Specialized in LLM in production, finetuning and evaluation.", "public_name": "Winnie Yeung", "guid": "87a88349-5904-57bb-8439-1efdf2b8e496", "url": "https://pretalx.com/pyconhk2024/speaker/UXMVWE/"}, {"code": "AS7VAX", "name": "Marcus Lau", "avatar": "https://pretalx.com/media/avatars/AS7VAX_mgzxI0F.webp", "biography": ".", "public_name": "Marcus Lau", "guid": "ea8a8bb5-e7e1-51fc-9187-3a68a7e51580", "url": "https://pretalx.com/pyconhk2024/speaker/AS7VAX/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/CEWPVB/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/CEWPVB/", "attachments": []}, {"guid": "59b3ed56-8446-5a51-93ce-74273e98294b", "code": "VRPMHX", "id": 53294, "logo": null, "date": "2024-11-16T14:00:00+08:00", "start": "14:00", "duration": "00:30", "room": "LT7", "slug": "pyconhk2024-53294-how-do-i-debug-my-pyspark-workloads", "url": "https://pretalx.com/pyconhk2024/talk/VRPMHX/", "title": "How do I debug my PySpark workloads?", "subtitle": "", "track": "Libraries / Tools", "type": "Talk", "language": "en", "abstract": "PySpark is widely adopted for data analysis in distributed computing environments. It supports not only the standard DataFrame API but also Python User Defined Functions (UDFs), Python Data Sources, Python UDTFs, and more. However, debugging and profiling applications in such distributed environments are often challenging - you can't simply add a breakpoint and inspect variables in your IDE.\n\nIn this presentation, I will demonstrate effective methods for debugging and profiling PySpark applications using existing tools. These include profiling tools that utilize cProfile, a standard Python profiler, along with various tricks and best practices for monitoring and debugging PySpark applications.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "SDEGBS", "name": "Hyukjin Kwon", "avatar": "https://pretalx.com/media/avatars/SDEGBS_IcG89Gu.webp", "biography": "Hyukjin is a Databricks software engineer as the tech-lead in OSS PySpark team, ASF member, Apache Spark PMC member and committer, working on many different areas in Apache Spark such as PySpark, Spark SQL, SparkR, infrastructure, etc. He is the top contributor in Apache Spark, and leads efforts such as Project Zen, Pandas API on Spark, and Python Spark Connect.", "public_name": "Hyukjin Kwon", "guid": "cedc5d4e-945d-5701-9559-c2a01cbfd021", "url": "https://pretalx.com/pyconhk2024/speaker/SDEGBS/"}, {"code": "AL7NR3", "name": "Allison Wang", "avatar": "https://pretalx.com/media/avatars/AL7NR3_s9DinJe.webp", "biography": "Allison is a software engineer at Databricks, working on Spark SQL and PySpark. She holds a Bachelor\u2019s degree in Computer Science from Carnegie Mellon University.", "public_name": "Allison Wang", "guid": "2d16209d-0ab4-5473-ada4-79161d8014b7", "url": "https://pretalx.com/pyconhk2024/speaker/AL7NR3/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/VRPMHX/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/VRPMHX/", "attachments": []}, {"guid": "f12db578-e1e2-5a51-b83a-5839f4a5300e", "code": "KZPSVD", "id": 50215, "logo": null, "date": "2024-11-16T14:40:00+08:00", "start": "14:40", "duration": "00:30", "room": "LT7", "slug": "pyconhk2024-50215-spark-less-local-data-stack-in-2024", "url": "https://pretalx.com/pyconhk2024/talk/KZPSVD/", "title": "Spark-less local data stack in 2024", "subtitle": "", "track": "Libraries / Tools", "type": "Talk", "language": "en", "abstract": "In 2024, the Composable Data Stack is getting more mature and it's only getting easier to mix tools for different use cases. The capabilities of local data stacks continue to grow with advancements in tools like Polars and DuckDB, the necessity of using Spark for end users is increasingly being questioned. \n\nTraditionally, Spark has been regarded as the most mature and reliable data processing framework, making it a default choice for many. However, the landscape has evolved significantly by 2024, with numerous libraries now offering more efficient and versatile local data processing solutions.\n\nThis presentation will explore these new alternatives, focusing on:\n\nSQLFrame: A framework providing a Spark DataFrame API that can interface with different computing engines.\nIbis: A unified API that seamlessly integrates dataframes and databases, eliminating the need to commit to a single engine.\nSQLGlot: A powerful tool for transpiling SQL queries between different dialects, enhancing compatibility and flexibility.\nOur goal is not to declare the obsolescence of Spark but to highlight efficient alternatives that may be better suited for specific environments and use cases. Attendees will gain insights into how these modern tools can be leveraged to optimize their local data processing workflows, potentially reducing the need for Spark in certain scenarios.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "WAGCJE", "name": "Nok Lam Chan", "avatar": "https://pretalx.com/media/avatars/WAGCJE_4gSSJ5p.webp", "biography": "I am a recovering data scientist, currently working as a software engineer for an open source project called Kedro (https://github.com/kedro-org/kedro) in London. I am passionate about open source and machine learning. In my free time, I like playing badminton.", "public_name": "Nok Lam Chan", "guid": "5699fff4-11b8-5aaf-8929-290ec7951fe3", "url": "https://pretalx.com/pyconhk2024/speaker/WAGCJE/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/KZPSVD/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/KZPSVD/", "attachments": []}, {"guid": "ae71d2da-8993-5250-b71d-cd8cc3b974f0", "code": "BHXJZA", "id": 52735, "logo": null, "date": "2024-11-16T15:15:00+08:00", "start": "15:15", "duration": "00:15", "room": "LT7", "slug": "pyconhk2024-52735-power-pytorch-training-with-centralized-ai-data-lake-and-advanced-data-selection-techniques", "url": "https://pretalx.com/pyconhk2024/talk/BHXJZA/", "title": "Power PyTorch Training with Centralized AI Data Lake and Advanced Data Selection Techniques", "subtitle": "", "track": "Libraries / Tools", "type": "Short talk", "language": "en", "abstract": "AI data is often stored in separate silos: databases, parquets/ORC files in cloud storage, and embeddings in vector databases, creating complexities in data management. \n\nTo address the above issue, the Lance columnar format is specifically designed for multimodal AI. It has unique combination of capabilities including fast scan and point query, storing large blobs inline, and zero-cost schema evolutions, enabling the creation of a centralized, massive-scale, all-in-one data lake that can store all kinds of AI data\u2014structured, unstructured, and embeddings\u2014in one cohesive dataset.\n\nLance-Pytorch Dataset utilizes Lance\u2019s embedded query engine. Written in Rust, it can quickly identify the most relevant and useful data for training without ever materializing such datasets using external systems. PyTorch training can leverage this unified data lake to seamlessly access and train from all data types, facilitating the creation of high-quality models.\n\nThis approach allows organizations to train or fine-tune foundation models that encompass comprehensive organizational knowledge, and significantly accelerates the training process while maintaining model quality.", "description": "", "recording_license": "", "do_not_record": false, "persons": [{"code": "3PGYXL", "name": "Yang Cen", "avatar": "https://pretalx.com/media/avatars/3PGYXL_GAbf8qA.webp", "biography": "I'm now a senior software engineer at LanceDB, and working on building the efficient open source columnar Lance format, vector search algorithms and database for AI. I have strong passion for the open source community, and contribute to multiple open source projects like Lance, Golang, Milvus, Arrow, etc.\n\nI'm focusing on vector searching, to make model inference / similarity searching more efficient and accurate.", "public_name": "Yang Cen", "guid": "9f5d576b-8b65-543a-8d02-eadcfd7acf7f", "url": "https://pretalx.com/pyconhk2024/speaker/3PGYXL/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/BHXJZA/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/BHXJZA/", "attachments": []}, {"guid": "a00cd972-a0a8-5c04-a8d7-2dba303dcf82", "code": "X9UZSA", "id": 52103, "logo": "https://pretalx.com/media/pyconhk2024/submissions/X9UZSA/Gemini_Pro_Vision_AI_Screen_Reader_Cover_4vOJl1M.png", "date": "2024-11-16T16:00:00+08:00", "start": "16:00", "duration": "00:30", "room": "LT7", "slug": "pyconhk2024-52103-enhancing-web-image-accessibility-for-visually-impaired-individuals-with-gemini-pro-vision-and-google-cloud-platform", "url": "https://pretalx.com/pyconhk2024/talk/X9UZSA/", "title": "Enhancing Web Image Accessibility for Visually Impaired Individuals with Gemini Pro Vision and Google Cloud Platform", "subtitle": "", "track": "LLM", "type": "Talk", "language": "zh-hant", "abstract": "# Background\nThe inability of visually impaired individuals access image information due to the lack of adherence to W3C web accessibility initiatives by websites. Currently, about 60% of websites lack meaningful alternate text for their images. Moreover, it is unfeasible to retroactively add descriptive text to all existing websites manually.", "description": "# GeProVis AI Screen Reader\nGeProVis is an abbreviated term for Gemini Pro Vision, and my students have significantly enhanced the conventional Google ChromeVox Screen Reader by incorporating the robust capabilities of Google Gemini Pro Vision. This blog post will focus on the details of Google Cloud Platform (GCP). In brief, ChromeVox can extract the image source url and send it to GCP.\n\nIn this talk, we will explain the technical details of the Python Google Cloud Function in this project.\n\n### Tech Blog\nhttps://medium.com/google-developer-experts/enhancing-web-image-accessibility-for-visually-impaired-individuals-with-gemini-pro-vision-and-07190b97fc38\n\n### Story\nhttps://medium.com/google-developer-experts/hkiit-students-use-gemini-pro-vision-to-develop-ai-screen-reader-acace2a0f830\n\nHong Kong Google Cloud Summit 2024 GeProVis AI Screen Reader MD and GM, Google Hong Kong Michael Yue\nhttps://youtu.be/VqSYB62xrz8\n\n### Awards \n- City I&T Grand Challenge 2024 - Innovation Award \n- Google GDSC 2024 Solution Challenge Global Top 100\n\n### Speakers:\nCyrus Wong - AWS ML Hero + Microsoft MVP - Azure AI + Google Developer Experts - GCP & AI/ML(GenAI)\nhttps://www.linkedin.com/in/cyruswong/\n\nHin Pak Markus Tsang (\u66fe\u61b2\u67cf) - HKIIT \u96f2\u7aef\u7cfb\u7d71\u53ca\u6578\u64da\u4e2d\u5fc3\u7ba1\u7406\u9ad8\u7d1a\u6587\u6191\u8ab2\u7a0b\nhttps://www.linkedin.com/in/hin-pak-markus-tsang-%E6%9B%BE%E6%86%B2%E6%9F%8F-327949b8/ \n\nKelvin Yiu - AWS Cloud Club Captain & HKIIT \u96f2\u7aef\u7cfb\u7d71\u53ca\u6578\u64da\u4e2d\u5fc3\u7ba1\u7406\u9ad8\u7d1a\u6587\u6191\u8ab2\u7a0b\nhttps://www.linkedin.com/in/kelvin-yiu-9a25b1290/", "recording_license": "", "do_not_record": false, "persons": [{"code": "KMA9WU", "name": "Cyrus Wong", "avatar": "https://pretalx.com/media/avatars/KMA9WU_HDxnq4h.webp", "biography": "\u9ec3\u4fca\u5f65\u662f\u9999\u6e2f\u9999\u6e2f\u8cc7\u8a0a\u79d1\u6280\u5b78\u9662(HKIIT)\u4f4d\u65bc IVE(\u674e\u60e0\u5229)\u8cc7\u8a0a\u79d1\u6280\u7cfb\u96f2\u7aef\u7cfb\u7d71\u53ca\u6578\u64da\u4e2d\u5fc3\u7ba1\u7406\u9ad8\u7d1a\u6587\u6191\u7684\u9ad8\u7d1a\u8b1b\u5e2b\uff0c\u64c1\u6709\u8c50\u5bcc\u7684\u77e5\u8b58\u548c\u5c08\u696d\u6280\u80fd\u3002\u4ed6\u71b1\u8877\u65bc\u5728\u5404\u7a2e\u5a92\u9ad4\u548c\u6d3b\u52d5\u4e2d\u63a8\u5ee3\u96f2\u7aef\u6280\u8853\u3002\u7531\u65bc\u4ed6\u7684\u5c08\u696d\u77e5\u8b58\u548c\u5c08\u696d\u6280\u80fd\uff0c\u4ed6\u7372\u5f97\u4e9e\u99ac\u905c\u96f2\u7aef\u904b\u7b97\u670d\u52d9AI\u82f1\u96c4\u3001\u5fae\u8edfAzure AI\u6700\u6709\u50f9\u503c\u5c08\u5bb6\u548cGoogle\u96f2\u7aef\u5e73\u53f0& AI/ML (GenAI)\u7684Google\u958b\u767c\u8005\u5c08\u5bb6\u7b49\u8457\u540d\u69ae\u8b7d\u7a31\u865f\uff0c\u662f\u4e16\u4e0a\u552f\u4e00\u80fd\u5920\u7372\u5f97IT\u696d\u754c\u4e09\u5de8\u982d\u540c\u6642\u516c\u8a8d\u7684\u5c08\u5bb6\u3002\nCyrus Wong is an accomplished senior lecturer who oversees the Higher Diploma program in Cloud and Data Centre Administration at the Hong Kong Institute of Information Technology (HKIIT) at IVE(Lee Wai Lee) in Hong Kong. He is a passionate advocate for the adoption of cloud technology across various media and events. With his extensive knowledge and expertise, he has earned prestigious recognitions such as AWS AI Hero, Microsoft MVP - Azure AI, and Google Developer Expert for Google Cloud Platform & AI/ML (GenAI).", "public_name": "Cyrus Wong", "guid": "2980312c-d7d3-5cc1-b08b-474949baaa1a", "url": "https://pretalx.com/pyconhk2024/speaker/KMA9WU/"}, {"code": "LDPPFM", "name": "Markus Tsang", "avatar": "https://pretalx.com/media/avatars/LDPPFM_YiRQpxe.webp", "biography": "Student studying cloud and data centre administration @HKIIT -IVE(LWL)", "public_name": "Markus Tsang", "guid": "1592474b-1dd4-55f6-9b85-0bebe2718ff5", "url": "https://pretalx.com/pyconhk2024/speaker/LDPPFM/"}, {"code": "CRLC8J", "name": "YIU Kelvin", "avatar": "https://pretalx.com/media/avatars/CRLC8J_81eVV8g.webp", "biography": "I am a tech enthusiast with hands-on experience in developing with Python and Golang, working on several cloud projects. Furthermore, I have a cybersecurity background and led a team to participate in numerous public cybersecurity competitions in Hong Kong during my high school studies.", "public_name": "YIU Kelvin", "guid": "c985f059-19c3-5b83-8a32-c699a7126973", "url": "https://pretalx.com/pyconhk2024/speaker/CRLC8J/"}], "links": [], "feedback_url": "https://pretalx.com/pyconhk2024/talk/X9UZSA/feedback/", "origin_url": "https://pretalx.com/pyconhk2024/talk/X9UZSA/", "attachments": []}]}}, {"index": 2, "date": "2024-11-17", "day_start": "2024-11-17T04:00:00+08:00", "day_end": "2024-11-18T03:59:00+08:00", "rooms": {}}]}}}