Ran: wget --mirror --convert-links --adjust-extension --page-requisites --no-parent https://2024.fossy.us/
283 lines
9.9 KiB
HTML
283 lines
9.9 KiB
HTML
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<!DOCTYPE html>
|
||
|
||
<html lang="en">
|
||
<head>
|
||
<meta charset="utf-8">
|
||
<meta http-equiv="X-UA-Compatible" content="IE=edge">
|
||
<meta name="description" content="">
|
||
<meta name="viewport" content="width=device-width, initial-scale=1">
|
||
|
||
<title>FOSSY 2024 | Presentation: Getting ML Right in a Complex Data World</title>
|
||
|
||
<meta property="og:type" content="website" />
|
||
|
||
<link rel="icon" href="../../../static/build/img/favicon.ico" />
|
||
|
||
<!-- Cards -->
|
||
<meta property="og:title" content="FOSSY 2024 | Presentation: Getting ML Right in a Complex Data World">
|
||
<meta property="og:description" content="" />
|
||
<meta property="og:url" content="https://2024.fossy.us/schedule/presentation/237/">
|
||
<meta name="twitter:site" content="@conservancy">
|
||
<meta name="twitter:image:alt" content="FOSSY 2024 | Presentation: Getting ML Right in a Complex Data World" />
|
||
<meta name="twitter:card" content="summary">
|
||
<meta name="twitter:image" content="https://2024.fossy.us/static/build/img/conservancy_logo_tall_mono.png" />
|
||
<meta property="og:image" content="https://2024.fossy.us/static/build/img/conservancy_logo_tall_mono.png" />
|
||
<meta property="og:image:width" content="400" />
|
||
<meta property="og:image:height" content="400" />
|
||
|
||
|
||
<link rel="stylesheet" href="https://use.fontawesome.com/releases/v5.6.3/css/all.css" integrity="sha384-UHRtZLI+pbxtHCWp1t77Bi1L4ZtiqrqD80Kn4Z8NTSRyMA2Fd33n5dQ8lWUE00s/" crossorigin="anonymous">
|
||
<link rel="stylesheet" href="https://unpkg.com/tachyons@4.12.0/css/tachyons.min.css">
|
||
<link href="../../../static/build/scss/app.css" rel="stylesheet" type="text/css" />
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<script type="text/javascript">
|
||
var CONF_TZ = "US/Pacific";
|
||
</script>
|
||
</head>
|
||
<body class="">
|
||
|
||
<header class="clearfix d-print-none">
|
||
|
||
|
||
|
||
|
||
<nav class="navbar navbar-expand-lg navbar-dark" style="background: rgb(19,119,82); background: linear-gradient(124deg, rgba(19,119,82,1) 0%, rgba(19,106,119,1) 100%); margin-bottom: 1rem">
|
||
<div class="container">
|
||
<h2 class="sans-serif f2 f1-ns b lh-solid tracked-tight mv0 mr3">
|
||
<a class="washed-yellow hover-washed-yellow" href="../../../index.html" style="text-decoration: none">
|
||
FOSSY 2024
|
||
</a>
|
||
</h2>
|
||
|
||
<button class="navbar-toggler" type="button" data-toggle="collapse" data-target="#navbarText" aria-controls="navbarText" aria-expanded="false" aria-label="Toggle navigation">
|
||
<span class="navbar-toggler-icon"></span>
|
||
</button>
|
||
|
||
|
||
|
||
<div class="collapse navbar-collapse" id="navbarText">
|
||
<ul class="navbar-nav mr-auto">
|
||
|
||
<li class="nav-item dropdown">
|
||
|
||
<a class="nav-link dropdown-toggle" href="index.html#" data-toggle="dropdown" aria-haspopup="true" aria-expanded="false">
|
||
About
|
||
</a>
|
||
<div class="dropdown-menu">
|
||
|
||
|
||
|
||
<a class="dropdown-item " href="../../../about/index.html">About FOSSY</a>
|
||
|
||
</div>
|
||
|
||
</li>
|
||
|
||
<li class="nav-item dropdown">
|
||
|
||
<a class="nav-link dropdown-toggle" href="index.html#" data-toggle="dropdown" aria-haspopup="true" aria-expanded="false">
|
||
Attend
|
||
</a>
|
||
<div class="dropdown-menu">
|
||
|
||
|
||
|
||
<a class="dropdown-item " href="../../../dashboard.html">Dashboard</a>
|
||
|
||
<a class="dropdown-item " href="../../../attend/tickets/index.html">Tickets</a>
|
||
|
||
<a class="dropdown-item " href="../../../travel/index.html">Travel and Lodging</a>
|
||
|
||
<a class="dropdown-item " href="../../../attend/volunteer/index.html">Volunteer</a>
|
||
|
||
<a class="dropdown-item " href="../../../events/index.html">Events</a>
|
||
|
||
<a class="dropdown-item " href="../../../attend/code-of-conduct.html">Code of Conduct</a>
|
||
|
||
<a class="dropdown-item " href="../../../attend/health-and-safety/index.html">Health and Safety</a>
|
||
|
||
<a class="dropdown-item " href="../../../attend/terms-and-conditions/index.html">Terms and Conditions</a>
|
||
|
||
<a class="dropdown-item " href="https://sfconservancy.org/privacy-policy/">Privacy policy</a>
|
||
|
||
</div>
|
||
|
||
</li>
|
||
|
||
<li class="nav-item dropdown">
|
||
|
||
<a class="nav-link dropdown-toggle" href="index.html#" data-toggle="dropdown" aria-haspopup="true" aria-expanded="false">
|
||
Program
|
||
</a>
|
||
<div class="dropdown-menu">
|
||
|
||
|
||
|
||
<a class="dropdown-item " href="../../index.html">Schedule</a>
|
||
|
||
<a class="dropdown-item " href="../../../pages/tracks/index.html">Tracks</a>
|
||
|
||
</div>
|
||
|
||
</li>
|
||
|
||
<li class="nav-item ">
|
||
|
||
<a class="nav-link" href="../../../sponsorship/index.html">
|
||
Sponsorship
|
||
</a>
|
||
|
||
</li>
|
||
|
||
</ul>
|
||
</div>
|
||
</div>
|
||
</nav>
|
||
|
||
</header>
|
||
|
||
|
||
|
||
<main role="main" class="container">
|
||
<div class="row">
|
||
<div class="col page-header">
|
||
<h1 class="page-title">Getting ML Right in a Complex Data World</h1>
|
||
<p class="lead">
|
||
|
||
338 | <span class="presentation-time" data-starttime="2024-08-04T11:45:00" data-endtime="2024-08-04T12:30:00">Sun 04 Aug 11:45 a.m.–12:30 p.m.</span>
|
||
|
||
</p>
|
||
</div>
|
||
</div>
|
||
|
||
|
||
|
||
<div class="row">
|
||
<div class="col-md-12">
|
||
|
||
|
||
</div>
|
||
</div>
|
||
|
||
|
||
|
||
<div class="row presentation-details">
|
||
<div class="col-md-3">
|
||
<h2 class="mt-4">Presented by</h4>
|
||
<ul class="list-unstyled">
|
||
|
||
<li class="mb-4 pb-2">
|
||
|
||
<img src="https://secure.gravatar.com/avatar/072c0f7292a2051d29ecfef3851df888?s=120&d=mp" alt="Oz Katz" class="rounded-circle img-fluid">
|
||
<p>
|
||
<strong><a href="../../../speaker/profile/343/index.html">Oz Katz</a></strong><br />
|
||
|
||
<a href="https://twitter.com/ozkatz100">@ozkatz100</a><br />
|
||
|
||
|
||
<a href="https://lakefs.io">https://lakefs.io</a>
|
||
|
||
</p>
|
||
<div class="bio">Oz Katz is the Co-Creator of the open source lakeFS Project, an open source platform that delivers resilience and manageability to object-storage based data lakes, as well as the CTO and co-founder of Treeverse, the company behind lakeFS. Oz engineered and maintained petabyte-scale data infrastructure at analytics giant SmilarWeb, which he joined after the acquisition of Swayy.</div>
|
||
</p>
|
||
</li>
|
||
|
||
</ul>
|
||
</div>
|
||
|
||
<div class="col-md-9 presentation-abstract">
|
||
<h2 class="mt-4">Abstract</h4>
|
||
|
||
<div class="abstract pb-4"><p>Machine learning workflows are iterative & repetitive to and from multiple steps including data labeling, data cleaning, preprocessing and feature selection methods during model training, just to arrive at an accurate model.
|
||
|
||
Quality ML at scale is only possible when we can reproduce a specific iteration of the ML experiment–and this is where data is key. This means: capturing the version of training data, ML code and model artifacts at each iteration is mandatory. However, to efficiently version ML experiments without duplicating code, data and models, data versioning tools are required. Open source tools like lakeFS make it possible to version all components of ML experiments without the need to keep multiple copies, and as an added benefit, save you storage costs as well.
|
||
|
||
In this talk, you will learn how to use a data versioning engine to intuitively and easily version your ML experiments and reproduce any specific iteration of the experiment.
|
||
|
||
This talk will demo through a live code example:
|
||
• Creating a basic ML experimentation framework with lakeFS (on Jupyter notebook)
|
||
• Reproducing ML components from a specific iteration of an experiment
|
||
• Building intuitive, zero-maintenance experiments infrastructure
|
||
|
||
All with common OSS data engineering stacks & open source tooling.</p></div>
|
||
|
||
|
||
|
||
</div>
|
||
</div>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
<script src="https://code.jquery.com/jquery-3.5.1.min.js" integrity="sha256-9/aliU8dGd2tb6OSsuzixeV4y/faTqgFtohetphbbj0=" crossorigin="anonymous"></script>
|
||
<script src="../../../static/build/js/app.js" type="text/javascript"></script>
|
||
<script src="../../../static/build/js/jquery.formset.js"></script>
|
||
<script src="https://cdnjs.cloudflare.com/ajax/libs/popper.js/1.12.9/umd/popper.min.js" integrity="sha384-ApNbgh9B+Y1QKtv3Rn7W3mgPxhU9K/ScQsAP7hUibX39j7fakFPskvXusvfa0b4Q" crossorigin="anonymous"></script>
|
||
<script src="../../../static/build/bootstrap/js/bootstrap.bundle.min.js"></script>
|
||
|
||
<!--no-analytics-->
|
||
|
||
|
||
<script src="../../../static/build/js/luxon.min.js"></script>
|
||
<script src="../../../static/build/js/schedule.js" type="text/javascript"></script>
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
|
||
</main>
|
||
|
||
<footer class="footer mt-4 d-print-none">
|
||
<div class="container py-4">
|
||
<!-- <div class="row">
|
||
<div class="col-md-12 pb-12 text-center" style="margin-top: 0px;margin-bottom: 0px;border-bottom-style: solid;border-bottom-width: 0px;padding-bottom: 20px;">Wifi: FOSSY <i>(see Registration for older wifi)</i><br/>PIN: outreachy1000</div>
|
||
</div> -->
|
||
<div class="row">
|
||
<div class="col-md-4 pb-4">
|
||
<strong>FOSSY 2024</strong> <br>
|
||
August 1–4th 2024 <br>
|
||
Portland, OR<br>
|
||
Timezone: PDT - UTC-7 <br>
|
||
<a href="mailto:conference@sfconservancy.org" alt="Email"><i class="far fa-envelope"></i></a> <a
|
||
href="https://twitter.com/conservancy" alt="Twitter"><i class="fab fa-twitter"></i></a> <a
|
||
href="https://social.sfconservancy.org/conservancy" alt="Mastodon"><i class="fab fa-mastodon"></i></a>
|
||
</div>
|
||
<div class="col-md-4 pb-4 text-center">
|
||
<a href="https://sfconservancy.org"><img src="../../../static/build/img/conservancy_logo.svg" alt="Software Freedom Conservancy logo" class="footer-image"></a>
|
||
</div>
|
||
<div class="col-md-4 pb-4 text-right">
|
||
<small>
|
||
<a href="index.html#">Back to top</a><br>
|
||
© 2024 <a href="https://sfconservancy.org/">Software Freedom Conservancy</a><br>
|
||
<a href="../../../credits/index.html">Credits</a>
|
||
</small>
|
||
</div>
|
||
</div>
|
||
</div>
|
||
</footer>
|
||
|
||
</body>
|
||
</html>
|