BibTeX records: Steven Euijong Whang

download as .bib file

% Journal article: Proc. VLDB Endow. 17(5), 2024.
@article{DBLP:journals/pvldb/TaeZPRW24,
  author       = {Tae, Ki Hyun and
                  Zhang, Hantian and
                  Park, Jaeyoung and
                  Rong, Kexin and
                  Whang, Steven Euijong},
  title        = {Falcon: Fair Active Learning using Multi-armed Bandits},
  journal      = {Proc. {VLDB} Endow.},
  volume       = {17},
  number       = {5},
  pages        = {952--965},
  year         = {2024},
  url          = {https://www.vldb.org/pvldb/vol17/p952-whang.pdf},
  timestamp    = {Tue, 26 Mar 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/pvldb/TaeZPRW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2024 conference paper. The booktitle reads "EAAI 2024"; the dblp export
% carries the typo "EAAI 2014" for this 2024 event.
@inproceedings{DBLP:conf/aaai/KimHW24,
  author       = {Kim, Minsu and
                  Hwang, Seonghyeon and
                  Whang, Steven Euijong},
  editor       = {Wooldridge, Michael J. and
                  Dy, Jennifer G. and
                  Natarajan, Sriraam},
  title        = {Quilt: Robust Data Segment Selection against Concept Drifts},
  booktitle    = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2024, Thirty-Sixth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver,
                  Canada},
  pages        = {21249--21257},
  publisher    = {{AAAI} Press},
  year         = {2024},
  url          = {https://doi.org/10.1609/aaai.v38i19.30119},
  doi          = {10.1609/AAAI.V38I19.30119},
  timestamp    = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/KimHW24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2401.12722).
@article{DBLP:journals/corr/abs-2401-12722,
  author       = {Tae, Ki Hyun and
                  Zhang, Hantian and
                  Park, Jaeyoung and
                  Rong, Kexin and
                  Whang, Steven Euijong},
  title        = {Falcon: Fair Active Learning using Multi-armed Bandits},
  journal      = {CoRR},
  volume       = {abs/2401.12722},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2401.12722},
  doi          = {10.48550/ARXIV.2401.12722},
  eprinttype   = {arXiv},
  eprint       = {2401.12722},
  timestamp    = {Mon, 05 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2401-12722.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2402.04644). The colon sits outside the protective
% braces so that sentence-casing styles still see the subtitle boundary and
% keep the capital of "Generalizable".
@article{DBLP:journals/corr/abs-2402-04644,
  author       = {Roh, Yuji and
                  Liu, Qingyun and
                  Gui, Huan and
                  Yuan, Zhe and
                  Tang, Yujin and
                  Whang, Steven Euijong and
                  Liu, Liang and
                  Bi, Shuchao and
                  Hong, Lichan and
                  Chi, Ed H. and
                  Zhao, Zhe},
  title        = {{LEVI}: Generalizable Fine-tuning via Layer-wise Ensemble of Different
                  Views},
  journal      = {CoRR},
  volume       = {abs/2402.04644},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2402.04644},
  doi          = {10.48550/ARXIV.2402.04644},
  eprinttype   = {arXiv},
  eprint       = {2402.04644},
  timestamp    = {Wed, 14 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2402-04644.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2403.05266). "ERBench" is brace-protected so that
% sentence-casing styles do not render it as "Erbench".
@article{DBLP:journals/corr/abs-2403-05266,
  author       = {Oh, Jio and
                  Kim, Soyeon and
                  Seo, Junseok and
                  Wang, Jindong and
                  Xu, Ruochen and
                  Xie, Xing and
                  Whang, Steven Euijong},
  title        = {{ERBench}: An Entity-Relationship based Automatically Verifiable Hallucination
                  Benchmark for Large Language Models},
  journal      = {CoRR},
  volume       = {abs/2403.05266},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2403.05266},
  doi          = {10.48550/ARXIV.2403.05266},
  eprinttype   = {arXiv},
  eprint       = {2403.05266},
  timestamp    = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2403-05266.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Proc. ACM Manag. Data 1(1), 2023. "iFlipper" is
% brace-protected so that sentence-casing styles do not render it as "iflipper".
@article{DBLP:journals/pacmmod/ZhangTPCW23,
  author       = {Zhang, Hantian and
                  Tae, Ki Hyun and
                  Park, Jaeyoung and
                  Chu, Xu and
                  Whang, Steven Euijong},
  title        = {{iFlipper}: Label Flipping for Individual Fairness},
  journal      = {Proc. {ACM} Manag. Data},
  volume       = {1},
  number       = {1},
  pages        = {8:1--8:26},
  year         = {2023},
  url          = {https://doi.org/10.1145/3588688},
  doi          = {10.1145/3588688},
  timestamp    = {Wed, 06 Dec 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/pacmmod/ZhangTPCW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Front matter of Proc. VLDB Endow. 16(12), 2023 (no page range recorded).
@article{DBLP:journals/pvldb/Koutrika023f,
  author       = {Koutrika, Georgia and
                  Yang, Jun and
                  Athanassoulis, Manos and
                  Stefanidis, Kostas and
                  Fan, Ju and
                  Quamar, Abdul and
                  Tian, Yuanyan and
                  Jindal, Alekh and
                  Binnig, Carsten and
                  Rogers, Jennie and
                  Roy, Senjuti Basu and
                  Whang, Steven Euijong and
                  Boehm, Matthias and
                  Elmore, Aaron J. and
                  Efthymiou, Vasilis and
                  Hu, Xiao and
                  Zhou, Xiaofang and
                  Fekete, Alan D.},
  title        = {Front Matter},
  journal      = {Proc. {VLDB} Endow.},
  volume       = {16},
  number       = {12},
  year         = {2023},
  url          = {https://www.vldb.org/pvldb/vol16/FrontMatterVol16No12.pdf},
  timestamp    = {Mon, 23 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pvldb/Koutrika023f.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: VLDB J. 32(4), 2023.
@article{DBLP:journals/vldb/WhangRSL23,
  author       = {Whang, Steven Euijong and
                  Roh, Yuji and
                  Song, Hwanjun and
                  Lee, Jae{-}Gil},
  title        = {Data collection and quality challenges in deep learning: a data-centric
                  {AI} perspective},
  journal      = {{VLDB} J.},
  volume       = {32},
  number       = {4},
  pages        = {791--813},
  year         = {2023},
  url          = {https://doi.org/10.1007/s00778-022-00775-9},
  doi          = {10.1007/S00778-022-00775-9},
  timestamp    = {Thu, 15 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/vldb/WhangRSL23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2023 conference paper. "XClusters" is brace-protected so that
% sentence-casing styles do not render it as "Xclusters".
@inproceedings{DBLP:conf/aaai/HwangW23,
  author       = {Hwang, Hyunseung and
                  Whang, Steven Euijong},
  editor       = {Williams, Brian and
                  Chen, Yiling and
                  Neville, Jennifer},
  title        = {{XClusters}: Explainability-First Clustering},
  booktitle    = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2023, Thirty-Fifth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February
                  7-14, 2023},
  pages        = {7962--7970},
  publisher    = {{AAAI} Press},
  year         = {2023},
  url          = {https://doi.org/10.1609/aaai.v37i7.25963},
  doi          = {10.1609/AAAI.V37I7.25963},
  timestamp    = {Mon, 04 Sep 2023 12:29:24 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/HwangW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% AAAI 2023 conference paper.
@inproceedings{DBLP:conf/aaai/HeoW23,
  author       = {Heo, Geon and
                  Whang, Steven Euijong},
  editor       = {Williams, Brian and
                  Chen, Yiling and
                  Neville, Jennifer},
  title        = {Redactor: {A} Data-Centric and Individualized Defense against Inference
                  Attacks},
  booktitle    = {Thirty-Seventh {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2023, Thirty-Fifth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2023, Thirteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2023, Washington, DC, USA, February
                  7-14, 2023},
  pages        = {14874--14882},
  publisher    = {{AAAI} Press},
  year         = {2023},
  url          = {https://doi.org/10.1609/aaai.v37i12.26737},
  doi          = {10.1609/AAAI.V37I12.26737},
  timestamp    = {Mon, 04 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/HeoW23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2023 conference paper (PMLR volume 202).
@inproceedings{DBLP:conf/icml/Roh0WS23,
  author       = {Roh, Yuji and
                  Lee, Kangwook and
                  Whang, Steven Euijong and
                  Suh, Changho},
  editor       = {Krause, Andreas and
                  Brunskill, Emma and
                  Cho, Kyunghyun and
                  Engelhardt, Barbara and
                  Sabato, Sivan and
                  Scarlett, Jonathan},
  title        = {Improving Fair Training under Correlation Shifts},
  booktitle    = {International Conference on Machine Learning, {ICML} 2023, 23-29 July
                  2023, Honolulu, Hawaii, {USA}},
  series       = {Proceedings of Machine Learning Research},
  volume       = {202},
  pages        = {29179--29209},
  publisher    = {{PMLR}},
  year         = {2023},
  url          = {https://proceedings.mlr.press/v202/roh23a.html},
  timestamp    = {Mon, 28 Aug 2023 17:23:08 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/Roh0WS23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2302.02323).
@article{DBLP:journals/corr/abs-2302-02323,
  author       = {Roh, Yuji and
                  Lee, Kangwook and
                  Whang, Steven Euijong and
                  Suh, Changho},
  title        = {Improving Fair Training under Correlation Shifts},
  journal      = {CoRR},
  volume       = {abs/2302.02323},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2302.02323},
  doi          = {10.48550/ARXIV.2302.02323},
  eprinttype   = {arXiv},
  eprint       = {2302.02323},
  timestamp    = {Fri, 10 Feb 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2302-02323.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2305.15165).
@article{DBLP:journals/corr/abs-2305-15165,
  author       = {Heo, Geon and
                  Seo, Junseok and
                  Whang, Steven Euijong},
  title        = {Personalized {DP-SGD} using Sampling Mechanisms},
  journal      = {CoRR},
  volume       = {abs/2305.15165},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2305.15165},
  doi          = {10.48550/ARXIV.2305.15165},
  eprinttype   = {arXiv},
  eprint       = {2305.15165},
  timestamp    = {Tue, 06 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2305-15165.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2312.09691).
@article{DBLP:journals/corr/abs-2312-09691,
  author       = {Kim, Minsu and
                  Hwang, Seonghyeon and
                  Whang, Steven Euijong},
  title        = {Quilt: Robust Data Segment Selection against Concept Drifts},
  journal      = {CoRR},
  volume       = {abs/2312.09691},
  year         = {2023},
  url          = {https://doi.org/10.48550/arXiv.2312.09691},
  doi          = {10.48550/ARXIV.2312.09691},
  eprinttype   = {arXiv},
  eprint       = {2312.09691},
  timestamp    = {Tue, 09 Jan 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2312-09691.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2202.02902).
@article{DBLP:journals/corr/abs-2202-02902,
  author       = {Heo, Geon and
                  Whang, Steven Euijong},
  title        = {Redactor: Targeted Disinformation Generation using Probabilistic Decision
                  Boundaries},
  journal      = {CoRR},
  volume       = {abs/2202.02902},
  year         = {2022},
  url          = {https://arxiv.org/abs/2202.02902},
  eprinttype   = {arXiv},
  eprint       = {2202.02902},
  timestamp    = {Wed, 09 Feb 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2202-02902.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2209.07047). "iFlipper" is brace-protected so that
% sentence-casing styles do not render it as "iflipper".
@article{DBLP:journals/corr/abs-2209-07047,
  author       = {Zhang, Hantian and
                  Tae, Ki Hyun and
                  Park, Jaeyoung and
                  Chu, Xu and
                  Whang, Steven Euijong},
  title        = {{iFlipper}: Label Flipping for Individual Fairness},
  journal      = {CoRR},
  volume       = {abs/2209.07047},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.07047},
  doi          = {10.48550/ARXIV.2209.07047},
  eprinttype   = {arXiv},
  eprint       = {2209.07047},
  timestamp    = {Thu, 01 Feb 2024 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-07047.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2209.10956). "XClusters" is brace-protected so that
% sentence-casing styles do not render it as "Xclusters".
@article{DBLP:journals/corr/abs-2209-10956,
  author       = {Hwang, Hyunseung and
                  Whang, Steven Euijong},
  title        = {{XClusters}: Explainability-first Clustering},
  journal      = {CoRR},
  volume       = {abs/2209.10956},
  year         = {2022},
  url          = {https://doi.org/10.48550/arXiv.2209.10956},
  doi          = {10.48550/ARXIV.2209.10956},
  eprinttype   = {arXiv},
  eprint       = {2209.10956},
  timestamp    = {Wed, 28 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2209-10956.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Data Eng. Bull. 44(1), 2021.
@article{DBLP:journals/debu/WhangTRH21,
  author       = {Whang, Steven Euijong and
                  Tae, Ki Hyun and
                  Roh, Yuji and
                  Heo, Geon},
  title        = {Responsible {AI} Challenges in End-to-end Machine Learning},
  journal      = {{IEEE} Data Eng. Bull.},
  volume       = {44},
  number       = {1},
  pages        = {79--91},
  year         = {2021},
  url          = {http://sites.computer.org/debull/A21mar/p79.pdf},
  timestamp    = {Fri, 04 Mar 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/debu/WhangTRH21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Knowl. Data Eng. 33(4), 2021.
@article{DBLP:journals/tkde/RohHW21,
  author       = {Roh, Yuji and
                  Heo, Geon and
                  Whang, Steven Euijong},
  title        = {A Survey on Data Collection for Machine Learning: {A} Big Data - {AI}
                  Integration Perspective},
  journal      = {{IEEE} Trans. Knowl. Data Eng.},
  volume       = {33},
  number       = {4},
  pages        = {1328--1347},
  year         = {2021},
  url          = {https://doi.org/10.1109/TKDE.2019.2946162},
  doi          = {10.1109/TKDE.2019.2946162},
  timestamp    = {Sun, 16 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tkde/RohHW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICLR 2021 conference paper. "FairBatch" is brace-protected so that
% sentence-casing styles do not render it as "Fairbatch".
@inproceedings{DBLP:conf/iclr/Roh0WS21,
  author       = {Roh, Yuji and
                  Lee, Kangwook and
                  Whang, Steven Euijong and
                  Suh, Changho},
  title        = {{FairBatch}: Batch Selection for Model Fairness},
  booktitle    = {9th International Conference on Learning Representations, {ICLR} 2021,
                  Virtual Event, Austria, May 3-7, 2021},
  publisher    = {OpenReview.net},
  year         = {2021},
  url          = {https://openreview.net/forum?id=YNnpaAKeCfx},
  timestamp    = {Wed, 23 Jun 2021 17:36:39 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/Roh0WS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% KDD 2021 conference contribution.
@inproceedings{DBLP:conf/kdd/0001RSW21,
  author       = {Lee, Jae{-}Gil and
                  Roh, Yuji and
                  Song, Hwanjun and
                  Whang, Steven Euijong},
  editor       = {Zhu, Feida and
                  Ooi, Beng Chin and
                  Miao, Chunyan},
  title        = {Machine Learning Robustness, Fairness, and their Convergence},
  booktitle    = {{KDD} '21: The 27th {ACM} {SIGKDD} Conference on Knowledge Discovery
                  and Data Mining, Virtual Event, Singapore, August 14-18, 2021},
  pages        = {4046--4047},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://doi.org/10.1145/3447548.3470799},
  doi          = {10.1145/3447548.3470799},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/kdd/0001RSW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% NeurIPS 2021 conference paper. The third author is written as
% "Steven Euijong Whang" (the dblp export has "Steven Whang" here) so the
% same person has one name form across this file.
@inproceedings{DBLP:conf/nips/RohLWS21,
  author       = {Roh, Yuji and
                  Lee, Kangwook and
                  Whang, Steven Euijong and
                  Suh, Changho},
  editor       = {Ranzato, Marc'Aurelio and
                  Beygelzimer, Alina and
                  Dauphin, Yann N. and
                  Liang, Percy and
                  Vaughan, Jennifer Wortman},
  title        = {Sample Selection for Fair and Robust Training},
  booktitle    = {Advances in Neural Information Processing Systems 34: Annual Conference
                  on Neural Information Processing Systems 2021, NeurIPS 2021, December
                  6-14, 2021, virtual},
  pages        = {815--827},
  year         = {2021},
  url          = {https://proceedings.neurips.cc/paper/2021/hash/07563a3fe3bbe7e3ba84431ad9d055af-Abstract.html},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/nips/RohLWS21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% SIGMOD 2021 conference paper. The system name "Slice Tuner" is
% brace-protected so that sentence-casing styles do not render "Slice tuner".
@inproceedings{DBLP:conf/sigmod/TaeW21,
  author       = {Tae, Ki Hyun and
                  Whang, Steven Euijong},
  editor       = {Li, Guoliang and
                  Li, Zhanhuai and
                  Idreos, Stratos and
                  Srivastava, Divesh},
  title        = {{Slice Tuner}: {A} Selective Data Acquisition Framework for Accurate
                  and Fair Machine Learning Models},
  booktitle    = {{SIGMOD} '21: International Conference on Management of Data, Virtual
                  Event, China, June 20-25, 2021},
  pages        = {1771--1783},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://doi.org/10.1145/3448016.3452792},
  doi          = {10.1145/3448016.3452792},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sigmod/TaeW21.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of the DEEM 2021 workshop. The third editor is written as
% "Steven Euijong Whang" (the dblp export has "Steven Whang" here) so the
% same person has one name form across this file.
@proceedings{DBLP:conf/sigmod/2021deem,
  editor       = {Boehm, Matthias and
                  Stoyanovich, Julia and
                  Whang, Steven Euijong},
  title        = {Proceedings of the Fifth Workshop on Data Management for End-To-End
                  Machine Learning, In conjunction with the 2021 {ACM} {SIGMOD/PODS}
                  Conference, DEEM@SIGMOD 2021, Virtual Event, China, 20 June, 2021},
  publisher    = {{ACM}},
  year         = {2021},
  url          = {https://doi.org/10.1145/3462462},
  doi          = {10.1145/3462462},
  isbn         = {978-1-4503-8486-5},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sigmod/2021deem.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2101.05967).
@article{DBLP:journals/corr/abs-2101-05967,
  author       = {Whang, Steven Euijong and
                  Tae, Ki Hyun and
                  Roh, Yuji and
                  Heo, Geon},
  title        = {Responsible {AI} Challenges in End-to-end Machine Learning},
  journal      = {CoRR},
  volume       = {abs/2101.05967},
  year         = {2021},
  url          = {https://arxiv.org/abs/2101.05967},
  eprinttype   = {arXiv},
  eprint       = {2101.05967},
  timestamp    = {Fri, 22 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2101-05967.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2106.03374). "MixRL" is brace-protected so that
% sentence-casing styles do not render it as "Mixrl".
@article{DBLP:journals/corr/abs-2106-03374,
  author       = {Hwang, Seonghyeon and
                  Whang, Steven Euijong},
  title        = {{MixRL}: Data Mixing Augmentation for Regression using Reinforcement
                  Learning},
  journal      = {CoRR},
  volume       = {abs/2106.03374},
  year         = {2021},
  url          = {https://arxiv.org/abs/2106.03374},
  eprinttype   = {arXiv},
  eprint       = {2106.03374},
  timestamp    = {Thu, 10 Jun 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2106-03374.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2110.14222).
@article{DBLP:journals/corr/abs-2110-14222,
  author       = {Roh, Yuji and
                  Lee, Kangwook and
                  Whang, Steven Euijong and
                  Suh, Changho},
  title        = {Sample Selection for Fair and Robust Training},
  journal      = {CoRR},
  volume       = {abs/2110.14222},
  year         = {2021},
  url          = {https://arxiv.org/abs/2110.14222},
  eprinttype   = {arXiv},
  eprint       = {2110.14222},
  timestamp    = {Fri, 29 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2110-14222.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2112.06409).
@article{DBLP:journals/corr/abs-2112-06409,
  author       = {Whang, Steven Euijong and
                  Roh, Yuji and
                  Song, Hwanjun and
                  Lee, Jae{-}Gil},
  title        = {Data Collection and Quality Challenges in Deep Learning: {A} Data-Centric
                  {AI} Perspective},
  journal      = {CoRR},
  volume       = {abs/2112.06409},
  year         = {2021},
  url          = {https://arxiv.org/abs/2112.06409},
  eprinttype   = {arXiv},
  eprint       = {2112.06409},
  timestamp    = {Mon, 03 Jan 2022 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2112-06409.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Proc. VLDB Endow. 13(12), 2020. The first author is written
% as "Steven Euijong Whang" (the dblp export has "Steven Whang" here) so the
% same person has one name form across this file.
@article{DBLP:journals/pvldb/Whang020,
  author       = {Whang, Steven Euijong and
                  Lee, Jae{-}Gil},
  title        = {Data Collection and Quality Challenges for Deep Learning},
  journal      = {Proc. {VLDB} Endow.},
  volume       = {13},
  number       = {12},
  pages        = {3429--3432},
  year         = {2020},
  url          = {http://www.vldb.org/pvldb/vol13/p3429-whang.pdf},
  doi          = {10.14778/3415478.3415562},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pvldb/Whang020.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: Proc. VLDB Endow. 14(1), 2020. The last author is written
% as "Steven Euijong Whang" (the dblp export has "Steven Whang" here), and the
% system name "Inspector Gadget" is brace-protected against sentence-casing.
@article{DBLP:journals/pvldb/HeoRHLW20,
  author       = {Heo, Geon and
                  Roh, Yuji and
                  Hwang, Seonghyeon and
                  Lee, Dayun and
                  Whang, Steven Euijong},
  title        = {{Inspector Gadget}: {A} Data Programming-based Labeling System for Industrial
                  Images},
  journal      = {Proc. {VLDB} Endow.},
  volume       = {14},
  number       = {1},
  pages        = {28--36},
  year         = {2020},
  url          = {http://www.vldb.org/pvldb/vol14/p28-heo.pdf},
  doi          = {10.14778/3421424.3421429},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pvldb/HeoRHLW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Journal article: IEEE Trans. Knowl. Data Eng. 32(12), 2020.
@article{DBLP:journals/tkde/ChungKPTW20,
  author       = {Chung, Yeounoh and
                  Kraska, Tim and
                  Polyzotis, Neoklis and
                  Tae, Ki Hyun and
                  Whang, Steven Euijong},
  title        = {Automated Data Slicing for Model Validation: {A} Big Data - {AI} Integration
                  Approach},
  journal      = {{IEEE} Trans. Knowl. Data Eng.},
  volume       = {32},
  number       = {12},
  pages        = {2284--2296},
  year         = {2020},
  url          = {https://doi.org/10.1109/TKDE.2019.2916074},
  doi          = {10.1109/TKDE.2019.2916074},
  timestamp    = {Thu, 31 Dec 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tkde/ChungKPTW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Workshop paper in LNCS volume 12633. The doi and url hold a raw underscore:
% these fields are read verbatim by biblatex and url-aware styles, so the
% escaped form from the dblp export would put a stray backslash in the link.
@inproceedings{DBLP:conf/dmah-ws/HwangW20,
  author       = {Hwang, Hyunseung and
                  Whang, Steven Euijong},
  editor       = {Gadepally, Vijay and
                  Mattson, Timothy G. and
                  Stonebraker, Michael and
                  Kraska, Tim and
                  Wang, Fusheng and
                  Luo, Gang and
                  Kong, Jun and
                  Dubovitskaya, Alevtina},
  title        = {Open-World {COVID-19} Data Visualization [Extended Abstract]},
  booktitle    = {Heterogeneous Data Management, Polystores, and Analytics for Healthcare
                  - {VLDB} Workshops, Poly 2020 and {DMAH} 2020, Virtual Event, August
                  31 and September 4, 2020, Revised Selected Papers},
  series       = {Lecture Notes in Computer Science},
  volume       = {12633},
  pages        = {81--84},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-71055-2_8},
  doi          = {10.1007/978-3-030-71055-2_8},
  timestamp    = {Wed, 10 Mar 2021 18:50:28 +0100},
  biburl       = {https://dblp.org/rec/conf/dmah-ws/HwangW20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% ICML 2020 conference paper (PMLR volume 119). The third author is written as
% "Steven Euijong Whang" (the dblp export has "Steven Whang" here), and
% "FR-Train" is brace-protected so sentence-casing does not yield "Fr-train".
@inproceedings{DBLP:conf/icml/RohLWS20,
  author       = {Roh, Yuji and
                  Lee, Kangwook and
                  Whang, Steven Euijong and
                  Suh, Changho},
  title        = {{FR-Train}: {A} Mutual Information-Based Approach to Fair and Robust
                  Training},
  booktitle    = {Proceedings of the 37th International Conference on Machine Learning,
                  {ICML} 2020, 13-18 July 2020, Virtual Event},
  series       = {Proceedings of Machine Learning Research},
  volume       = {119},
  pages        = {8147--8157},
  publisher    = {{PMLR}},
  year         = {2020},
  url          = {http://proceedings.mlr.press/v119/roh20a.html},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icml/RohLWS20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume: DASFAA 2020, Part I (LNCS 12112).
@proceedings{DBLP:conf/dasfaa/2020-1,
  editor       = {Nah, Yunmook and
                  Cui, Bin and
                  Lee, Sang{-}Won and
                  Yu, Jeffrey Xu and
                  Moon, Yang{-}Sae and
                  Whang, Steven Euijong},
  title        = {Database Systems for Advanced Applications - 25th International Conference,
                  {DASFAA} 2020, Jeju, South Korea, September 24-27, 2020, Proceedings,
                  Part {I}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12112},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-59410-7},
  doi          = {10.1007/978-3-030-59410-7},
  isbn         = {978-3-030-59409-1},
  timestamp    = {Fri, 25 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/dasfaa/2020-1.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume: DASFAA 2020, Part II (LNCS 12113).
@proceedings{DBLP:conf/dasfaa/2020-2,
  editor       = {Nah, Yunmook and
                  Cui, Bin and
                  Lee, Sang{-}Won and
                  Yu, Jeffrey Xu and
                  Moon, Yang{-}Sae and
                  Whang, Steven Euijong},
  title        = {Database Systems for Advanced Applications - 25th International Conference,
                  {DASFAA} 2020, Jeju, South Korea, September 24-27, 2020, Proceedings,
                  Part {II}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12113},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-59416-9},
  doi          = {10.1007/978-3-030-59416-9},
  isbn         = {978-3-030-59415-2},
  timestamp    = {Fri, 25 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/dasfaa/2020-2.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume: DASFAA 2020, Part III (LNCS 12114).
@proceedings{DBLP:conf/dasfaa/2020-3,
  editor       = {Nah, Yunmook and
                  Cui, Bin and
                  Lee, Sang{-}Won and
                  Yu, Jeffrey Xu and
                  Moon, Yang{-}Sae and
                  Whang, Steven Euijong},
  title        = {Database Systems for Advanced Applications - 25th International Conference,
                  {DASFAA} 2020, Jeju, South Korea, September 24-27, 2020, Proceedings,
                  Part {III}},
  series       = {Lecture Notes in Computer Science},
  volume       = {12114},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-59419-0},
  doi          = {10.1007/978-3-030-59419-0},
  isbn         = {978-3-030-59418-3},
  timestamp    = {Fri, 25 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/dasfaa/2020-3.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume: DASFAA 2020 International Workshops (LNCS 12115).
@proceedings{DBLP:conf/dasfaa/2020w,
  editor       = {Nah, Yunmook and
                  Kim, Chulyun and
                  Kim, Seon Ho and
                  Moon, Yang{-}Sae and
                  Whang, Steven Euijong},
  title        = {Database Systems for Advanced Applications. {DASFAA} 2020 International
                  Workshops - BDMS, SeCoP, BDQM, GDMA, and AIDE, Jeju, South Korea,
                  September 24-27, 2020, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {12115},
  publisher    = {Springer},
  year         = {2020},
  url          = {https://doi.org/10.1007/978-3-030-59413-8},
  doi          = {10.1007/978-3-030-59413-8},
  isbn         = {978-3-030-59412-1},
  timestamp    = {Tue, 22 Sep 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/dasfaa/2020w.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% Proceedings volume of the DEEM 2020 workshop. The second editor is written
% as "Steven Euijong Whang" (the dblp export has "Steven Whang" here) so the
% same person has one name form across this file.
@proceedings{DBLP:conf/sigmod/2020deem,
  editor       = {Schelter, Sebastian and
                  Whang, Steven Euijong and
                  Stoyanovich, Julia},
  title        = {Proceedings of the Fourth Workshop on Data Management for End-To-End
                  Machine Learning, In conjunction with the 2020 {ACM} {SIGMOD/PODS}
                  Conference, DEEM@SIGMOD 2020, Portland, OR, USA, June 14, 2020},
  publisher    = {{ACM}},
  year         = {2020},
  url          = {https://doi.org/10.1145/3399579},
  doi          = {10.1145/3399579},
  isbn         = {978-1-4503-8023-2},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sigmod/2020deem.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% arXiv preprint (CoRR abs/2002.10234). "FR-Train" is brace-protected so that
% sentence-casing styles do not render it as "Fr-train".
@article{DBLP:journals/corr/abs-2002-10234,
  author       = {Roh, Yuji and
                  Lee, Kangwook and
                  Whang, Steven Euijong and
                  Suh, Changho},
  title        = {{FR-Train}: {A} mutual information-based approach to fair and robust
                  training},
  journal      = {CoRR},
  volume       = {abs/2002.10234},
  year         = {2020},
  url          = {https://arxiv.org/abs/2002.10234},
  eprinttype   = {arXiv},
  eprint       = {2002.10234},
  timestamp    = {Mon, 15 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2002-10234.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The system name Slice Tuner is brace-protected so sentence-casing styles keep both capitals.
@article{DBLP:journals/corr/abs-2003-04549,
  author       = {Tae, Ki Hyun and
                  Whang, Steven Euijong},
  title        = {{Slice Tuner}: {A} Selective Data Collection Framework for Accurate
                  and Fair Machine Learning Models},
  journal      = {CoRR},
  volume       = {abs/2003.04549},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.04549},
  eprinttype   = {arXiv},
  eprint       = {2003.04549},
  timestamp    = {Tue, 17 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-04549.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The system name Inspector Gadget is brace-protected so sentence-casing styles keep both capitals.
@article{DBLP:journals/corr/abs-2004-03264,
  author       = {Heo, Geon and
                  Roh, Yuji and
                  Hwang, Seonghyeon and
                  Lee, Dayun and
                  Whang, Steven Euijong},
  title        = {{Inspector Gadget}: {A} Data Programming-based Labeling System for
                  Industrial Images},
  journal      = {CoRR},
  volume       = {abs/2004.03264},
  year         = {2020},
  url          = {https://arxiv.org/abs/2004.03264},
  eprinttype   = {arXiv},
  eprint       = {2004.03264},
  timestamp    = {Wed, 08 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2004-03264.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The camelCase name FairBatch is brace-protected so sentence-casing styles do not turn it into Fairbatch.
@article{DBLP:journals/corr/abs-2012-01696,
  author       = {Roh, Yuji and
                  Lee, Kangwook and
                  Whang, Steven Euijong and
                  Suh, Changho},
  title        = {{FairBatch}: Batch Selection for Model Fairness},
  journal      = {CoRR},
  volume       = {abs/2012.01696},
  year         = {2020},
  url          = {https://arxiv.org/abs/2012.01696},
  eprinttype   = {arXiv},
  eprint       = {2012.01696},
  timestamp    = {Mon, 15 Feb 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2012-01696.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The system name Slice Finder is brace-protected so sentence-casing styles keep both capitals.
@inproceedings{DBLP:conf/icde/ChungKPTW19,
  author       = {Chung, Yeounoh and
                  Kraska, Tim and
                  Polyzotis, Neoklis and
                  Tae, Ki Hyun and
                  Whang, Steven Euijong},
  title        = {{Slice Finder}: Automated Data Slicing for Model Validation},
  booktitle    = {35th {IEEE} International Conference on Data Engineering, {ICDE} 2019,
                  Macao, China, April 8-11, 2019},
  pages        = {1550--1553},
  publisher    = {{IEEE}},
  year         = {2019},
  url          = {https://doi.org/10.1109/ICDE.2019.00139},
  doi          = {10.1109/ICDE.2019.00139},
  timestamp    = {Wed, 16 Oct 2019 14:14:56 +0200},
  biburl       = {https://dblp.org/rec/conf/icde/ChungKPTW19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/mlsys/BreckP0WZ19,
  author       = {Breck, Eric and
                  Polyzotis, Neoklis and
                  Roy, Sudip and
                  Whang, Steven and
                  Zinkevich, Martin},
  editor       = {Talwalkar, Ameet and
                  Smith, Virginia and
                  Zaharia, Matei},
  title        = {Data Validation for Machine Learning},
  booktitle    = {Proceedings of Machine Learning and Systems 2019, MLSys 2019, Stanford,
                  CA, USA, March 31 - April 2, 2019},
  publisher    = {mlsys.org},
  year         = {2019},
  url          = {https://proceedings.mlsys.org/book/267.pdf},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/mlsys/BreckP0WZ19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sigmod/TaeROKW19,
  author       = {Tae, Ki Hyun and
                  Roh, Yuji and
                  Oh, Young Hun and
                  Kim, Hyunsu and
                  Whang, Steven Euijong},
  editor       = {Schelter, Sebastian and
                  Polyzotis, Neoklis and
                  Seufert, Stephan and
                  Vartak, Manasi},
  title        = {Data Cleaning for Accurate, Fair, and Robust Models: {A} Big Data
                  - {AI} Integration Approach},
  booktitle    = {Proceedings of the 3rd International Workshop on Data Management for
                  End-to-End Machine Learning, DEEM@SIGMOD 2019, Amsterdam, The Netherlands,
                  June 30, 2019},
  pages        = {5:1--5:4},
  publisher    = {{ACM}},
  year         = {2019},
  url          = {https://doi.org/10.1145/3329486.3329493},
  doi          = {10.1145/3329486.3329493},
  timestamp    = {Wed, 05 Jun 2019 14:52:53 +0200},
  biburl       = {https://dblp.org/rec/conf/sigmod/TaeROKW19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The arXiv link uses the https scheme.
@article{DBLP:journals/corr/abs-1904-10761,
  author       = {Tae, Ki Hyun and
                  Roh, Yuji and
                  Oh, Young Hun and
                  Kim, Hyunsu and
                  Whang, Steven Euijong},
  title        = {Data Cleaning for Accurate, Fair, and Robust Models: {A} Big Data
                  - {AI} Integration Approach},
  journal      = {CoRR},
  volume       = {abs/1904.10761},
  year         = {2019},
  url          = {https://arxiv.org/abs/1904.10761},
  eprinttype   = {arXiv},
  eprint       = {1904.10761},
  timestamp    = {Thu, 02 May 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1904-10761.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sigmod/PolyzotisRWZ18,
  author       = {Polyzotis, Neoklis and
                  Roy, Sudip and
                  Whang, Steven Euijong and
                  Zinkevich, Martin},
  title        = {Data Lifecycle Challenges in Production Machine Learning: {A} Survey},
  journal      = {{SIGMOD} Rec.},
  volume       = {47},
  number       = {2},
  pages        = {17--28},
  year         = {2018},
  url          = {https://doi.org/10.1145/3299887.3299891},
  doi          = {10.1145/3299887.3299891},
  timestamp    = {Fri, 06 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/sigmod/PolyzotisRWZ18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The system name Slice Finder is brace-protected against sentence-casing; the arXiv link uses https.
@article{DBLP:journals/corr/abs-1807-06068,
  author       = {Chung, Yeounoh and
                  Kraska, Tim and
                  Polyzotis, Neoklis and
                  Whang, Steven Euijong},
  title        = {{Slice Finder}: Automated Data Slicing for Model Validation},
  journal      = {CoRR},
  volume       = {abs/1807.06068},
  year         = {2018},
  url          = {https://arxiv.org/abs/1807.06068},
  eprinttype   = {arXiv},
  eprint       = {1807.06068},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1807-06068.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The arXiv link uses the https scheme.
@article{DBLP:journals/corr/abs-1811-03402,
  author       = {Roh, Yuji and
                  Heo, Geon and
                  Whang, Steven Euijong},
  title        = {A Survey on Data Collection for Machine Learning: a Big Data - {AI}
                  Integration Perspective},
  journal      = {CoRR},
  volume       = {abs/1811.03402},
  year         = {2018},
  url          = {https://arxiv.org/abs/1811.03402},
  eprinttype   = {arXiv},
  eprint       = {1811.03402},
  timestamp    = {Fri, 23 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-03402.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% TensorFlow is brace-protected so sentence-casing styles do not lowercase the product name.
@inproceedings{DBLP:conf/kdd/BaylorBCFFHHIJK17,
  author       = {Baylor, Denis and
                  Breck, Eric and
                  Cheng, Heng{-}Tze and
                  Fiedel, Noah and
                  Foo, Chuan Yu and
                  Haque, Zakaria and
                  Haykal, Salem and
                  Ispir, Mustafa and
                  Jain, Vihan and
                  Koc, Levent and
                  Koo, Chiu Yuen and
                  Lew, Lukasz and
                  Mewald, Clemens and
                  Modi, Akshay Naresh and
                  Polyzotis, Neoklis and
                  Ramesh, Sukriti and
                  Roy, Sudip and
                  Whang, Steven Euijong and
                  Wicke, Martin and
                  Wilkiewicz, Jarek and
                  Zhang, Xin and
                  Zinkevich, Martin},
  title        = {{TFX:} {A} {TensorFlow}-Based Production-Scale Machine Learning Platform},
  booktitle    = {Proceedings of the 23rd {ACM} {SIGKDD} International Conference on
                  Knowledge Discovery and Data Mining, Halifax, NS, Canada, August 13
                  - 17, 2017},
  pages        = {1387--1395},
  publisher    = {{ACM}},
  year         = {2017},
  url          = {https://doi.org/10.1145/3097983.3098021},
  doi          = {10.1145/3097983.3098021},
  timestamp    = {Fri, 25 Dec 2020 01:14:16 +0100},
  biburl       = {https://dblp.org/rec/conf/kdd/BaylorBCFFHHIJK17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sigmod/Polyzotis0WZ17,
  author       = {Polyzotis, Neoklis and
                  Roy, Sudip and
                  Whang, Steven Euijong and
                  Zinkevich, Martin},
  editor       = {Salihoglu, Semih and
                  Zhou, Wenchao and
                  Chirkova, Rada and
                  Yang, Jun and
                  Suciu, Dan},
  title        = {Data Management Challenges in Production Machine Learning},
  booktitle    = {Proceedings of the 2017 {ACM} International Conference on Management
                  of Data, {SIGMOD} Conference 2017, Chicago, IL, USA, May 14-19, 2017},
  pages        = {1723--1726},
  publisher    = {{ACM}},
  year         = {2017},
  url          = {https://doi.org/10.1145/3035918.3054782},
  doi          = {10.1145/3035918.3054782},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/sigmod/Polyzotis0WZ17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The proper nouns Google's and Goods are brace-protected so sentence-casing styles do not lowercase them.
@article{DBLP:journals/debu/HalevyKNOPRW16,
  author       = {Halevy, Alon Y. and
                  Korn, Flip and
                  Noy, Natalya Fridman and
                  Olston, Christopher and
                  Polyzotis, Neoklis and
                  Roy, Sudip and
                  Whang, Steven Euijong},
  title        = {Managing {Google's} data lake: an overview of the {Goods} system},
  journal      = {{IEEE} Data Eng. Bull.},
  volume       = {39},
  number       = {3},
  pages        = {5--14},
  year         = {2016},
  url          = {http://sites.computer.org/debull/A16sept/p5.pdf},
  timestamp    = {Tue, 10 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/debu/HalevyKNOPRW16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sigir/FaridIWY16,
  author       = {Farid, Mina H. and
                  Ilyas, Ihab F. and
                  Whang, Steven Euijong and
                  Yu, Cong},
  editor       = {Perego, Raffaele and
                  Sebastiani, Fabrizio and
                  Aslam, Javed A. and
                  Ruthven, Ian and
                  Zobel, Justin},
  title        = {{LONLIES:} Estimating Property Values for Long Tail Entities},
  booktitle    = {Proceedings of the 39th International {ACM} {SIGIR} conference on
                  Research and Development in Information Retrieval, {SIGIR} 2016, Pisa,
                  Italy, July 17-21, 2016},
  pages        = {1125--1128},
  publisher    = {{ACM}},
  year         = {2016},
  url          = {https://doi.org/10.1145/2911451.2911466},
  doi          = {10.1145/2911451.2911466},
  timestamp    = {Wed, 14 Nov 2018 10:58:11 +0100},
  biburl       = {https://dblp.org/rec/conf/sigir/FaridIWY16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The proper noun Google's is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/sigmod/HalevyKNOPRW16,
  author       = {Halevy, Alon Y. and
                  Korn, Flip and
                  Noy, Natalya Fridman and
                  Olston, Christopher and
                  Polyzotis, Neoklis and
                  Roy, Sudip and
                  Whang, Steven Euijong},
  editor       = {{\"{O}}zcan, Fatma and
                  Koutrika, Georgia and
                  Madden, Sam},
  title        = {Goods: Organizing {Google's} Datasets},
  booktitle    = {Proceedings of the 2016 International Conference on Management of
                  Data, {SIGMOD} Conference 2016, San Francisco, CA, USA, June 26 -
                  July 01, 2016},
  pages        = {795--806},
  publisher    = {{ACM}},
  year         = {2016},
  url          = {https://doi.org/10.1145/2882903.2903730},
  doi          = {10.1145/2882903.2903730},
  timestamp    = {Wed, 14 Nov 2018 10:56:20 +0100},
  biburl       = {https://dblp.org/rec/conf/sigmod/HalevyKNOPRW16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/www/HalevyNSWY16,
  author       = {Halevy, Alon Y. and
                  Noy, Natalya Fridman and
                  Sarawagi, Sunita and
                  Whang, Steven Euijong and
                  Yu, Xiao},
  editor       = {Bourdeau, Jacqueline and
                  Hendler, Jim and
                  Nkambou, Roger and
                  Horrocks, Ian and
                  Zhao, Ben Y.},
  title        = {Discovering Structure in the Universe of Attribute Names},
  booktitle    = {Proceedings of the 25th International Conference on World Wide Web,
                  {WWW} 2016, Montreal, Canada, April 11 - 15, 2016},
  pages        = {939--949},
  publisher    = {{ACM}},
  year         = {2016},
  url          = {https://doi.org/10.1145/2872427.2882975},
  doi          = {10.1145/2872427.2882975},
  timestamp    = {Tue, 12 Apr 2022 14:46:29 +0200},
  biburl       = {https://dblp.org/rec/conf/www/HalevyNSWY16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/webdb/Movshovitz-Attias15,
  author       = {Movshovitz{-}Attias, Dana and
                  Whang, Steven Euijong and
                  Noy, Natalya Fridman and
                  Halevy, Alon Y.},
  editor       = {Stoyanovich, Julia and
                  Suchanek, Fabian M.},
  title        = {Discovering Subsumption Relationships for Web-Based Ontologies},
  booktitle    = {Proceedings of the 18th International Workshop on Web and Databases,
                  Melbourne, VIC, Australia, May 31, 2015},
  pages        = {62--69},
  publisher    = {{ACM}},
  year         = {2015},
  url          = {https://doi.org/10.1145/2767109.2767111},
  doi          = {10.1145/2767109.2767111},
  timestamp    = {Tue, 06 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/webdb/Movshovitz-Attias15.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/pvldb/GuptaHWWW14,
  author       = {Gupta, Rahul and
                  Halevy, Alon Y. and
                  Wang, Xuezhi and
                  Whang, Steven Euijong and
                  Wu, Fei},
  title        = {Biperpedia: An Ontology for Search Applications},
  journal      = {Proc. {VLDB} Endow.},
  volume       = {7},
  number       = {7},
  pages        = {505--516},
  year         = {2014},
  url          = {http://www.vldb.org/pvldb/vol7/p505-gupta.pdf},
  doi          = {10.14778/2732286.2732288},
  timestamp    = {Sat, 25 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pvldb/GuptaHWWW14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/vldb/WhangG14,
  author       = {Whang, Steven Euijong and
                  Garcia{-}Molina, Hector},
  title        = {Incremental entity resolution on rules and data},
  journal      = {{VLDB} J.},
  volume       = {23},
  number       = {1},
  pages        = {77--102},
  year         = {2014},
  url          = {https://doi.org/10.1007/s00778-013-0315-0},
  doi          = {10.1007/S00778-013-0315-0},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/vldb/WhangG14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The camelCase name ReNoun is brace-protected so sentence-casing styles do not turn it into Renoun.
@inproceedings{DBLP:conf/emnlp/YahyaWGH14,
  author       = {Yahya, Mohamed and
                  Whang, Steven and
                  Gupta, Rahul and
                  Halevy, Alon Y.},
  editor       = {Moschitti, Alessandro and
                  Pang, Bo and
                  Daelemans, Walter},
  title        = {{ReNoun}: Fact Extraction for Nominal Attributes},
  booktitle    = {Proceedings of the 2014 Conference on Empirical Methods in Natural
                  Language Processing, {EMNLP} 2014, October 25-29, 2014, Doha, Qatar,
                  {A} meeting of SIGDAT, a Special Interest Group of the {ACL}},
  pages        = {325--335},
  publisher    = {{ACL}},
  year         = {2014},
  url          = {https://doi.org/10.3115/v1/d14-1038},
  doi          = {10.3115/V1/D14-1038},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/emnlp/YahyaWGH14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/pvldb/WhangLG13,
  author       = {Whang, Steven Euijong and
                  Lofgren, Peter and
                  Garcia{-}Molina, Hector},
  title        = {Question Selection for Crowd Entity Resolution},
  journal      = {Proc. {VLDB} Endow.},
  volume       = {6},
  number       = {6},
  pages        = {349--360},
  year         = {2013},
  url          = {http://www.vldb.org/pvldb/vol6/p349-whang.pdf},
  doi          = {10.14778/2536336.2536337},
  timestamp    = {Sat, 25 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pvldb/WhangLG13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tkde/WhangMG13,
  author       = {Whang, Steven Euijong and
                  Marmaros, David and
                  Garcia{-}Molina, Hector},
  title        = {Pay-As-You-Go Entity Resolution},
  journal      = {{IEEE} Trans. Knowl. Data Eng.},
  volume       = {25},
  number       = {5},
  pages        = {1111--1124},
  year         = {2013},
  url          = {https://doi.org/10.1109/TKDE.2012.43},
  doi          = {10.1109/TKDE.2012.43},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tkde/WhangMG13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/vldb/WhangG13,
  author       = {Whang, Steven Euijong and
                  Garcia{-}Molina, Hector},
  title        = {Joint entity resolution on multiple datasets},
  journal      = {{VLDB} J.},
  volume       = {22},
  number       = {6},
  pages        = {773--795},
  year         = {2013},
  url          = {https://doi.org/10.1007/s00778-013-0308-z},
  doi          = {10.1007/S00778-013-0308-Z},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/vldb/WhangG13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cikm/WhangG13,
  author       = {Whang, Steven Euijong and
                  Garcia{-}Molina, Hector},
  editor       = {He, Qi and
                  Iyengar, Arun and
                  Nejdl, Wolfgang and
                  Pei, Jian and
                  Rastogi, Rajeev},
  title        = {Disinformation techniques for entity resolution},
  booktitle    = {22nd {ACM} International Conference on Information and Knowledge Management,
                  CIKM'13, San Francisco, CA, USA, October 27 - November 1, 2013},
  pages        = {715--720},
  publisher    = {{ACM}},
  year         = {2013},
  url          = {https://doi.org/10.1145/2505515.2505636},
  doi          = {10.1145/2505515.2505636},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cikm/WhangG13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@phdthesis{DBLP:phd/us/Whang12,
  author       = {Whang, Steven Euijong},
  title        = {Data analytics: integration and privacy},
  school       = {Stanford University, {USA}},
  year         = {2012},
  url          = {https://searchworks.stanford.edu/view/9625291},
  timestamp    = {Fri, 02 Sep 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/phd/us/Whang12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icde/WhangG12,
  author       = {Whang, Steven Euijong and
                  Garcia{-}Molina, Hector},
  editor       = {Kementsietsidis, Anastasios and
                  Salles, Marcos Antonio Vaz},
  title        = {Joint Entity Resolution},
  booktitle    = {{IEEE} 28th International Conference on Data Engineering {(ICDE} 2012),
                  Washington, DC, {USA} (Arlington, Virginia), 1-5 April, 2012},
  pages        = {294--305},
  publisher    = {{IEEE} Computer Society},
  year         = {2012},
  url          = {https://doi.org/10.1109/ICDE.2012.119},
  doi          = {10.1109/ICDE.2012.119},
  timestamp    = {Fri, 24 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icde/WhangG12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sdmw/WhangG12,
  author       = {Whang, Steven Euijong and
                  Garcia{-}Molina, Hector},
  editor       = {Jonker, Willem and
                  Petkovic, Milan},
  title        = {A Model for Quantifying Information Leakage},
  booktitle    = {Secure Data Management - 9th {VLDB} Workshop, {SDM} 2012, Istanbul,
                  Turkey, August 27, 2012. Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {7482},
  pages        = {25--44},
  publisher    = {Springer},
  year         = {2012},
  url          = {https://doi.org/10.1007/978-3-642-32873-2\_3},
  doi          = {10.1007/978-3-642-32873-2\_3},
  timestamp    = {Tue, 14 May 2019 10:00:38 +0200},
  biburl       = {https://dblp.org/rec/conf/sdmw/WhangG12.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/debu/WhangG11,
  author       = {Whang, Steven Euijong and
                  Garcia{-}Molina, Hector},
  title        = {Developments in Generic Entity Resolution},
  journal      = {{IEEE} Data Eng. Bull.},
  volume       = {34},
  number       = {3},
  pages        = {51--59},
  year         = {2011},
  url          = {http://sites.computer.org/debull/A11sept/whang1.pdf},
  timestamp    = {Tue, 10 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/debu/WhangG11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/cidr/WhangG11,
  author       = {Whang, Steven and
                  Garcia{-}Molina, Hector},
  title        = {Managing Information Leakage},
  booktitle    = {Fifth Biennial Conference on Innovative Data Systems Research, {CIDR}
                  2011, Asilomar, CA, USA, January 9-12, 2011, Online Proceedings},
  pages        = {79--84},
  publisher    = {www.cidrdb.org},
  year         = {2011},
  url          = {http://cidrdb.org/cidr2011/Papers/CIDR11\_Paper9.pdf},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/cidr/WhangG11.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/pvldb/MenestrinaWG10,
  author       = {Menestrina, David and
                  Whang, Steven and
                  Garcia{-}Molina, Hector},
  title        = {Evaluating Entity Resolution Results},
  journal      = {Proc. {VLDB} Endow.},
  volume       = {3},
  number       = {1},
  pages        = {208--219},
  year         = {2010},
  url          = {http://www.vldb.org/pvldb/vldb2010/pvldb\_vol3/R18.pdf},
  doi          = {10.14778/1920841.1920871},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pvldb/MenestrinaWG10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/pvldb/WhangG10,
  author       = {Whang, Steven and
                  Garcia{-}Molina, Hector},
  title        = {Entity Resolution with Evolving Rules},
  journal      = {Proc. {VLDB} Endow.},
  volume       = {3},
  number       = {1},
  pages        = {1326--1337},
  year         = {2010},
  url          = {http://www.vldb.org/pvldb/vldb2010/pvldb\_vol3/R117.pdf},
  doi          = {10.14778/1920841.1921004},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pvldb/WhangG10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The proper adjective Boolean is brace-protected so sentence-casing styles keep its capital.
@article{DBLP:journals/pvldb/WhangBSVVYG09,
  author       = {Whang, Steven and
                  Brower, Chad and
                  Shanmugasundaram, Jayavel and
                  Vassilvitskii, Sergei and
                  Vee, Erik and
                  Yerneni, Ramana and
                  Garcia{-}Molina, Hector},
  title        = {Indexing {Boolean} Expressions},
  journal      = {Proc. {VLDB} Endow.},
  volume       = {2},
  number       = {1},
  pages        = {37--48},
  year         = {2009},
  url          = {http://www.vldb.org/pvldb/vol2/vldb09-83.pdf},
  doi          = {10.14778/1687627.1687633},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/pvldb/WhangBSVVYG09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/vldb/BenjellounGMSWW09,
  author       = {Benjelloun, Omar and
                  Garcia{-}Molina, Hector and
                  Menestrina, David and
                  Su, Qi and
                  Whang, Steven Euijong and
                  Widom, Jennifer},
  title        = {Swoosh: a generic approach to entity resolution},
  journal      = {{VLDB} J.},
  volume       = {18},
  number       = {1},
  pages        = {255--276},
  year         = {2009},
  url          = {https://doi.org/10.1007/s00778-008-0098-x},
  doi          = {10.1007/S00778-008-0098-X},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/vldb/BenjellounGMSWW09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/vldb/WhangBG09,
  author       = {Whang, Steven Euijong and
                  Benjelloun, Omar and
                  Garcia{-}Molina, Hector},
  title        = {Generic entity resolution with negative rules},
  journal      = {{VLDB} J.},
  volume       = {18},
  number       = {6},
  pages        = {1261--1277},
  year         = {2009},
  url          = {https://doi.org/10.1007/s00778-009-0136-3},
  doi          = {10.1007/S00778-009-0136-3},
  timestamp    = {Mon, 26 Jun 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/vldb/WhangBG09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The camelCase name QuickStart is brace-protected so sentence-casing styles do not turn it into Quickstart.
@inproceedings{DBLP:conf/icde/CastellanosJCZWD09,
  author       = {Castellanos, Mal{\'{u}} and
                  Jimenez, Ivo and
                  Coddington, Neal and
                  Zeller, Hans and
                  Whang, Steven and
                  Dayal, Umeshwar},
  editor       = {Ioannidis, Yannis E. and
                  Lee, Dik Lun and
                  Ng, Raymond T.},
  title        = {{QuickStart}: An Upfront Client-Based Design Advisor for Parallel Data
                  Warehouses},
  booktitle    = {Proceedings of the 25th International Conference on Data Engineering,
                  {ICDE} 2009, March 29 2009 - April 2 2009, Shanghai, China},
  pages        = {1543--1546},
  publisher    = {{IEEE} Computer Society},
  year         = {2009},
  url          = {https://doi.org/10.1109/ICDE.2009.169},
  doi          = {10.1109/ICDE.2009.169},
  timestamp    = {Fri, 15 Sep 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icde/CastellanosJCZWD09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/sigmod/WhangMKTG09,
  author       = {Whang, Steven Euijong and
                  Menestrina, David and
                  Koutrika, Georgia and
                  Theobald, Martin and
                  Garcia{-}Molina, Hector},
  editor       = {{\c{C}}etintemel, Ugur and
                  Zdonik, Stanley B. and
                  Kossmann, Donald and
                  Tatbul, Nesime},
  title        = {Entity resolution with iterative blocking},
  booktitle    = {Proceedings of the {ACM} {SIGMOD} International Conference on Management
                  of Data, {SIGMOD} 2009, Providence, Rhode Island, USA, June 29 - July
                  2, 2009},
  pages        = {219--232},
  publisher    = {{ACM}},
  year         = {2009},
  url          = {https://doi.org/10.1145/1559845.1559870},
  doi          = {10.1145/1559845.1559870},
  timestamp    = {Thu, 14 Oct 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/sigmod/WhangMKTG09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
% The language name XQuery is brace-protected so sentence-casing styles do not lowercase it.
@inproceedings{DBLP:conf/dasfaa/LeeKWL06,
  author       = {Lee, Ki{-}Hoon and
                  Kim, Seoyoung and
                  Whang, Euijong and
                  Lee, Jae{-}Gil},
  editor       = {Lee, Mong{-}Li and
                  Tan, Kian{-}Lee and
                  Wuwongse, Vilas},
  title        = {A Practitioner's Approach to Normalizing {XQuery} Expressions},
  booktitle    = {Database Systems for Advanced Applications, 11th International Conference,
                  {DASFAA} 2006, Singapore, April 12-15, 2006, Proceedings},
  series       = {Lecture Notes in Computer Science},
  volume       = {3882},
  pages        = {437--453},
  publisher    = {Springer},
  year         = {2006},
  url          = {https://doi.org/10.1007/11733836\_31},
  doi          = {10.1007/11733836\_31},
  timestamp    = {Sat, 28 Aug 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/dasfaa/LeeKWL06.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
a service of Schloss Dagstuhl - Leibniz Center for Informatics