[go: up one dir, main page]

BibTeX records: Takayuki Osa

download as .bib file

@inproceedings{DBLP:conf/humanoids/ArakiMOH25,
  author    = {Araki, Tomoyuki and
               Mukuta, Yusuke and
               Osa, Takayuki and
               Harada, Tatsuya},
  title     = {Few-shot Imitation Learning by Variable-Length Trajectory Retrieval from a Large and Diverse Dataset},
  booktitle = {24th {IEEE-RAS} International Conference on Humanoid Robots, Humanoids 2025, Seoul, Republic of Korea, September 30 - October 2, 2025},
  pages     = {829--836},
  publisher = {{IEEE}},
  year      = {2025},
  url       = {https://doi.org/10.1109/Humanoids65713.2025.11203120},
  doi       = {10.1109/HUMANOIDS65713.2025.11203120},
  timestamp = {Tue, 04 Nov 2025 09:03:19 +0100},
  biburl    = {https://dblp.org/rec/conf/humanoids/ArakiMOH25.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/OmuraOOMH25,
  author       = {Motoki Omura and
                  Kazuki Ota and
                  Takayuki Osa and
                  Yusuke Mukuta and
                  Tatsuya Harada},
  editor       = {Aarti Singh and
                  Maryam Fazel and
                  Daniel Hsu and
                  Simon Lacoste{-}Julien and
                  Felix Berkenkamp and
                  Tegan Maharaj and
                  Kiri Wagstaff and
                  Jerry Zhu},
  title        = {Gradual Transition from {Bellman} Optimality Operator to {Bellman} Operator
                  in Online Reinforcement Learning},
  booktitle    = {Forty-second International Conference on Machine Learning, {ICML}
                  2025, Vancouver, BC, Canada, July 13-19, 2025},
  series       = {Proceedings of Machine Learning Research},
  volume       = {267},
  publisher    = {{PMLR} / OpenReview.net},
  year         = {2025},
  url          = {https://proceedings.mlr.press/v267/omura25a.html},
  timestamp    = {Wed, 04 Feb 2026 16:54:16 +0100},
  biburl       = {https://dblp.org/rec/conf/icml/OmuraOOMH25.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/YoshimitsuOAI25,
  author       = {Yoshimitsu, Yuhei and
                  Osa, Takayuki and
                  Ben Amor, Heni and
                  Ikemoto, Shuhei},
  title        = {Uncertainty-aware Motion Planning based on Stochastic Forward/Inverse
                  Kinematics Models for Tensegrity Manipulators},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2025, Hangzhou, China, October 19-25, 2025},
  pages        = {21657--21663},
  publisher    = {{IEEE}},
  year         = {2025},
  url          = {https://doi.org/10.1109/IROS60139.2025.11246289},
  doi          = {10.1109/IROS60139.2025.11246289},
  timestamp    = {Wed, 07 Jan 2026 13:35:46 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/YoshimitsuOAI25.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2506-05968,
  author       = {Motoki Omura and
                  Kazuki Ota and
                  Takayuki Osa and
                  Yusuke Mukuta and
                  Tatsuya Harada},
  title        = {Gradual Transition from {Bellman} Optimality Operator to {Bellman} Operator
                  in Online Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2506.05968},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2506.05968},
  doi          = {10.48550/ARXIV.2506.05968},
  eprinttype   = {arXiv},
  eprint       = {2506.05968},
  timestamp    = {Mon, 07 Jul 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2506-05968.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2507-10843,
  author       = {Motoki Omura and
                  Yusuke Mukuta and
                  Kazuki Ota and
                  Takayuki Osa and
                  Tatsuya Harada},
  title        = {Offline Reinforcement Learning with {Wasserstein} Regularization via
                  Optimal Transport Maps},
  journal      = {CoRR},
  volume       = {abs/2507.10843},
  year         = {2025},
  url          = {https://doi.org/10.48550/arXiv.2507.10843},
  doi          = {10.48550/ARXIV.2507.10843},
  eprinttype   = {arXiv},
  eprint       = {2507.10843},
  timestamp    = {Thu, 14 Aug 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2507-10843.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:conf/rlc/OmuraOMH24,
  author       = {Motoki Omura and
                  Takayuki Osa and
                  Yusuke Mukuta and
                  Tatsuya Harada},
  title        = {Stabilizing Extreme {Q-learning} by {Maclaurin} Expansion},
  journal      = {Reinforcement Learning Journal},
  volume       = {3},
  pages        = {1427--1440},
  year         = {2024},
  url          = {https://rlj.cs.umass.edu/2024/papers/Paper171.html},
  timestamp    = {Wed, 26 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/rlc/OmuraOMH24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:conf/rlc/AckermannOS24,
  author       = {Johannes Ackermann and
                  Takayuki Osa and
                  Masashi Sugiyama},
  title        = {Offline Reinforcement Learning from Datasets with Structured Non-Stationarity},
  journal      = {Reinforcement Learning Journal},
  volume       = {5},
  pages        = {2140--2161},
  year         = {2024},
  url          = {https://rlj.cs.umass.edu/2024/papers/Paper287.html},
  timestamp    = {Wed, 26 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/rlc/AckermannOS24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tmlr/ChangWOH24,
  author       = {Jen{-}Yen Chang and
                  Thomas Westfechtel and
                  Takayuki Osa and
                  Tatsuya Harada},
  title        = {Offline Deep Reinforcement Learning for Visual Distractions via Domain
                  Adversarial Training},
  journal      = {Transactions on Machine Learning Research},
  volume       = {2024},
  year         = {2024},
  url          = {https://openreview.net/forum?id=dce6ZGkJ1Z},
  timestamp    = {Mon, 16 Jun 2025 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tmlr/ChangWOH24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/OmuraOMH24,
  author       = {Motoki Omura and
                  Takayuki Osa and
                  Yusuke Mukuta and
                  Tatsuya Harada},
  editor       = {Michael J. Wooldridge and
                  Jennifer G. Dy and
                  Sriraam Natarajan},
  title        = {Symmetric {Q-learning}: Reducing Skewness of {Bellman} Error in Online
                  Reinforcement Learning},
  booktitle    = {Thirty-Eighth {AAAI} Conference on Artificial Intelligence, {AAAI}
                  2024, Thirty-Sixth Conference on Innovative Applications of Artificial
                  Intelligence, {IAAI} 2024, Fourteenth Symposium on Educational Advances
                  in Artificial Intelligence, {EAAI} 2024, February 20-27, 2024, Vancouver,
                  Canada},
  pages        = {14474--14481},
  publisher    = {{AAAI} Press},
  year         = {2024},
  url          = {https://doi.org/10.1609/aaai.v38i13.29362},
  doi          = {10.1609/AAAI.V38I13.29362},
  timestamp    = {Sun, 04 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/OmuraOMH24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/humanoids/AbeOOCH24,
  author    = {Abe, Haruki and
               Osa, Takayuki and
               Omura, Motoki and
               Chang, Jen{-}Yen and
               Harada, Tatsuya},
  title     = {Latent Space Curriculum Reinforcement Learning in High-Dimensional Contextual Spaces and Its Application to Robotic Piano Playing},
  booktitle = {23rd {IEEE-RAS} International Conference on Humanoid Robots, Humanoids 2024, Nancy, France, November 22-24, 2024},
  pages     = {266--273},
  publisher = {{IEEE}},
  year      = {2024},
  url       = {https://doi.org/10.1109/Humanoids58906.2024.10769872},
  doi       = {10.1109/HUMANOIDS58906.2024.10769872},
  timestamp = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/humanoids/AbeOOCH24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icml/OsaH24,
  author    = {Osa, Takayuki and
               Harada, Tatsuya},
  editor    = {Salakhutdinov, Ruslan and
               Kolter, Zico and
               Heller, Katherine A. and
               Weller, Adrian and
               Oliver, Nuria and
               Scarlett, Jonathan and
               Berkenkamp, Felix},
  title     = {Discovering Multiple Solutions from a Single Task in Offline Reinforcement Learning},
  booktitle = {Forty-first International Conference on Machine Learning, {ICML} 2024, Vienna, Austria, July 21-27, 2024},
  series    = {Proceedings of Machine Learning Research},
  volume    = {235},
  pages     = {38864--38884},
  publisher = {{PMLR} / OpenReview.net},
  year      = {2024},
  url       = {https://proceedings.mlr.press/v235/osa24a.html},
  timestamp = {Mon, 09 Feb 2026 15:35:36 +0100},
  biburl    = {https://dblp.org/rec/conf/icml/OsaH24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/ONeillRMGPLPGMJ24,
  author       = {Abby O'Neill and
                  Abdul Rehman and
                  Abhiram Maddukuri and
                  Abhishek Gupta and
                  Abhishek Padalkar and
                  Abraham Lee and
                  Acorn Pooley and
                  Agrim Gupta and
                  Ajay Mandlekar and
                  Ajinkya Jain and
                  Albert Tung and
                  Alex Bewley and
                  Alexander Herzog and
                  Alex Irpan and
                  Alexander Khazatsky and
                  Anant Rai and
                  Anchit Gupta and
                  Andrew E. Wang and
                  Anikait Singh and
                  Animesh Garg and
                  Aniruddha Kembhavi and
                  Annie Xie and
                  Anthony Brohan and
                  Antonin Raffin and
                  Archit Sharma and
                  Arefeh Yavary and
                  Arhan Jain and
                  Ashwin Balakrishna and
                  Ayzaan Wahid and
                  Ben Burgess{-}Limerick and
                  Beomjoon Kim and
                  Bernhard Sch{\"{o}}lkopf and
                  Blake Wulfe and
                  Brian Ichter and
                  Cewu Lu and
                  Charles Xu and
                  Charlotte Le and
                  Chelsea Finn and
                  Chen Wang and
                  Chenfeng Xu and
                  Cheng Chi and
                  Chenguang Huang and
                  Christine Chan and
                  Christopher Agia and
                  Chuer Pan and
                  Chuyuan Fu and
                  Coline Devin and
                  Danfei Xu and
                  Daniel Morton and
                  Danny Driess and
                  Daphne Chen and
                  Deepak Pathak and
                  Dhruv Shah and
                  Dieter B{\"{u}}chler and
                  Dinesh Jayaraman and
                  Dmitry Kalashnikov and
                  Dorsa Sadigh and
                  Edward Johns and
                  Ethan Paul Foster and
                  Fangchen Liu and
                  Federico Ceola and
                  Fei Xia and
                  Feiyu Zhao and
                  Freek Stulp and
                  Gaoyue Zhou and
                  Gaurav S. Sukhatme and
                  Gautam Salhotra and
                  Ge Yan and
                  Gilbert Feng and
                  Giulio Schiavi and
                  Glen Berseth and
                  Gregory Kahn and
                  Guanzhi Wang and
                  Hao Su and
                  Haoshu Fang and
                  Haochen Shi and
                  Henghui Bao and
                  Heni Ben Amor and
                  Henrik I. Christensen and
                  Hiroki Furuta and
                  Homer Walke and
                  Hongjie Fang and
                  Huy Ha and
                  Igor Mordatch and
                  Ilija Radosavovic and
                  Isabel Leal and
                  Jacky Liang and
                  Jad Abou{-}Chakra and
                  Jaehyung Kim and
                  Jaimyn Drake and
                  Jan Peters and
                  Jan Schneider and
                  Jasmine Hsu and
                  Jeannette Bohg and
                  Jeffrey T. Bingham and
                  Jeffrey Wu and
                  Jensen Gao and
                  Jiaheng Hu and
                  Jiajun Wu and
                  Jialin Wu and
                  Jiankai Sun and
                  Jianlan Luo and
                  Jiayuan Gu and
                  Jie Tan and
                  Jihoon Oh and
                  Jimmy Wu and
                  Jingpei Lu and
                  Jingyun Yang and
                  Jitendra Malik and
                  Jo{\~{a}}o Silv{\'{e}}rio and
                  Joey Hejna and
                  Jonathan Booher and
                  Jonathan Tompson and
                  Jonathan Yang and
                  Jordi Salvador and
                  Joseph J. Lim and
                  Junhyek Han and
                  Kaiyuan Wang and
                  Kanishka Rao and
                  Karl Pertsch and
                  Karol Hausman and
                  Keegan Go and
                  Keerthana Gopalakrishnan and
                  Ken Goldberg and
                  Kendra Byrne and
                  Kenneth Oslund and
                  Kento Kawaharazuka and
                  Kevin Black and
                  Kevin Lin and
                  Kevin Zhang and
                  Kiana Ehsani and
                  Kiran Lekkala and
                  Kirsty Ellis and
                  Krishan Rana and
                  Krishnan Srinivasan and
                  Kuan Fang and
                  Kunal Pratap Singh and
                  Kuo{-}Hao Zeng and
                  Kyle Hatch and
                  Kyle Hsu and
                  Laurent Itti and
                  Lawrence Yunliang Chen and
                  Lerrel Pinto and
                  Li Fei{-}Fei and
                  Liam Tan and
                  Linxi Jim Fan and
                  Lionel Ott and
                  Lisa Lee and
                  Luca Weihs and
                  Magnum Chen and
                  Marion Lepert and
                  Marius Memmel and
                  Masayoshi Tomizuka and
                  Masha Itkina and
                  Mateo Guaman Castro and
                  Max Spero and
                  Maximilian Du and
                  Michael Ahn and
                  Michael C. Yip and
                  Mingtong Zhang and
                  Mingyu Ding and
                  Minho Heo and
                  Mohan Kumar Srirama and
                  Mohit Sharma and
                  Moo Jin Kim and
                  Naoaki Kanazawa and
                  Nicklas Hansen and
                  Nicolas Heess and
                  Nikhil J. Joshi and
                  Niko S{\"{u}}nderhauf and
                  Ning Liu and
                  Norman Di Palo and
                  Nur Muhammad (Mahi) Shafiullah and
                  Oier Mees and
                  Oliver Kroemer and
                  Osbert Bastani and
                  Pannag R. Sanketi and
                  Patrick Tree Miller and
                  Patrick Yin and
                  Paul Wohlhart and
                  Peng Xu and
                  Peter David Fagan and
                  Peter Mitrano and
                  Pierre Sermanet and
                  Pieter Abbeel and
                  Priya Sundaresan and
                  Qiuyu Chen and
                  Quan Vuong and
                  Rafael Rafailov and
                  Ran Tian and
                  Ria Doshi and
                  Roberto Mart{\'{\i}}n{-}Mart{\'{\i}}n and
                  Rohan Baijal and
                  Rosario Scalise and
                  Rose Hendrix and
                  Roy Lin and
                  Runjia Qian and
                  Ruohan Zhang and
                  Russell Mendonca and
                  Rutav Shah and
                  Ryan Hoque and
                  Ryan Julian and
                  Samuel Bustamante{-}Gomez and
                  Sean Kirmani and
                  Sergey Levine and
                  Shan Lin and
                  Sherry Moore and
                  Shikhar Bahl and
                  Shivin Dass and
                  Shubham D. Sonawani and
                  Shuran Song and
                  Sichun Xu and
                  Siddhant Haldar and
                  Siddharth Karamcheti and
                  Simeon Adebola and
                  Simon Guist and
                  Soroush Nasiriany and
                  Stefan Schaal and
                  Stefan Welker and
                  Stephen Tian and
                  Subramanian Ramamoorthy and
                  Sudeep Dasari and
                  Suneel Belkhale and
                  Sungjae Park and
                  Suraj Nair and
                  Suvir Mirchandani and
                  Takayuki Osa and
                  Tanmay Gupta and
                  Tatsuya Harada and
                  Tatsuya Matsushima and
                  Ted Xiao and
                  Thomas Kollar and
                  Tianhe Yu and
                  Tianli Ding and
                  Todor Davchev and
                  Tony Z. Zhao and
                  Travis Armstrong and
                  Trevor Darrell and
                  Trinity Chung and
                  Vidhi Jain and
                  Vincent Vanhoucke and
                  Wei Zhan and
                  Wenxuan Zhou and
                  Wolfram Burgard and
                  Xi Chen and
                  Xiaolong Wang and
                  Xinghao Zhu and
                  Xinyang Geng and
                  Xiyuan Liu and
                  Liangwei Xu and
                  Xuanlin Li and
                  Yao Lu and
                  Yecheng Jason Ma and
                  Yejin Kim and
                  Yevgen Chebotar and
                  Yifan Zhou and
                  Yifeng Zhu and
                  Yilin Wu and
                  Ying Xu and
                  Yixuan Wang and
                  Yonatan Bisk and
                  Yoonyoung Cho and
                  Youngwoon Lee and
                  Yuchen Cui and
                  Yue Cao and
                  Yueh{-}Hua Wu and
                  Yujin Tang and
                  Yuke Zhu and
                  Yunchu Zhang and
                  Yunfan Jiang and
                  Yunshuang Li and
                  Yunzhu Li and
                  Yusuke Iwasawa and
                  Yutaka Matsuo and
                  Zehan Ma and
                  Zhuo Xu and
                  Zichen Jeff Cui and
                  Zichen Zhang and
                  Zipeng Lin},
  title        = {{Open X-Embodiment}: Robotic Learning Datasets and {RT-X} Models: {Open
                  X-Embodiment} Collaboration},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2024, Yokohama, Japan, May 13-17, 2024},
  pages        = {6892--6903},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/ICRA57147.2024.10611477},
  doi          = {10.1109/ICRA57147.2024.10611477},
  timestamp    = {Thu, 25 Dec 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icra/ONeillRMGPLPGMJ24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/MorihiraDBHHOO24,
  author    = {Morihira, Naoki and
               Deo, Pranav and
               Bhadu, Manoj and
               Hayashi, Akinobu and
               Hasegawa, Tadaaki and
               Otsubo, Satoshi and
               Osa, Takayuki},
  title     = {Touch-Based Manipulation with Multi-Fingered Robot using Off-policy {RL} and Temporal Contrastive Learning},
  booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2024, Yokohama, Japan, May 13-17, 2024},
  pages     = {7501--7507},
  publisher = {{IEEE}},
  year      = {2024},
  url       = {https://doi.org/10.1109/ICRA57147.2024.10610239},
  doi       = {10.1109/ICRA57147.2024.10610239},
  timestamp = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/conf/icra/MorihiraDBHHOO24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/OsaH24,
  author    = {Osa, Takayuki and
               Harada, Tatsuya},
  title     = {Robustifying a Policy in Multi-Agent {RL} with Diverse Cooperative Behaviors and Adversarial Style Sampling for Assistive Tasks},
  booktitle = {{IEEE} International Conference on Robotics and Automation, {ICRA} 2024, Yokohama, Japan, May 13-17, 2024},
  pages     = {15158--15164},
  publisher = {{IEEE}},
  year      = {2024},
  url       = {https://doi.org/10.1109/ICRA57147.2024.10611719},
  doi       = {10.1109/ICRA57147.2024.10611719},
  timestamp = {Sun, 06 Oct 2024 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/conf/icra/OsaH24.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/YoshimitsuOAI24,
  author       = {Yoshimitsu, Yuhei and
                  Osa, Takayuki and
                  Ben Amor, Heni and
                  Ikemoto, Shuhei},
  title        = {Active Learning for Forward/Inverse Kinematics of Redundantly-driven
                  Flexible Tensegrity Manipulator},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2024, Abu Dhabi, United Arab Emirates, October 14-18, 2024},
  pages        = {3512--3518},
  publisher    = {{IEEE}},
  year         = {2024},
  url          = {https://doi.org/10.1109/IROS58592.2024.10802310},
  doi          = {10.1109/IROS58592.2024.10802310},
  timestamp    = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iros/YoshimitsuOAI24.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2403-00344,
  author     = {Osa, Takayuki and
                Harada, Tatsuya},
  title      = {Robustifying a Policy in Multi-Agent {RL} with Diverse Cooperative Behaviors and Adversarial Style Sampling for Assistive Tasks},
  journal    = {CoRR},
  volume     = {abs/2403.00344},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2403.00344},
  doi        = {10.48550/ARXIV.2403.00344},
  eprinttype = {arXiv},
  eprint     = {2403.00344},
  timestamp  = {Tue, 02 Apr 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2403-00344.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2403-07704,
  author       = {Motoki Omura and
                  Takayuki Osa and
                  Yusuke Mukuta and
                  Tatsuya Harada},
  title        = {Symmetric {Q-learning}: Reducing Skewness of {Bellman} Error in Online
                  Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2403.07704},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2403.07704},
  doi          = {10.48550/ARXIV.2403.07704},
  eprinttype   = {arXiv},
  eprint       = {2403.07704},
  timestamp    = {Thu, 04 Apr 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2403-07704.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2405-14114,
  author     = {Ackermann, Johannes and
                Osa, Takayuki and
                Sugiyama, Masashi},
  title      = {Offline Reinforcement Learning from Datasets with Structured Non-Stationarity},
  journal    = {CoRR},
  volume     = {abs/2405.14114},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2405.14114},
  doi        = {10.48550/ARXIV.2405.14114},
  eprinttype = {arXiv},
  eprint     = {2405.14114},
  timestamp  = {Wed, 19 Jun 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2405-14114.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2406-04896,
  author       = {Motoki Omura and
                  Takayuki Osa and
                  Yusuke Mukuta and
                  Tatsuya Harada},
  title        = {Stabilizing Extreme {Q-learning} by {Maclaurin} Expansion},
  journal      = {CoRR},
  volume       = {abs/2406.04896},
  year         = {2024},
  url          = {https://doi.org/10.48550/arXiv.2406.04896},
  doi          = {10.48550/ARXIV.2406.04896},
  eprinttype   = {arXiv},
  eprint       = {2406.04896},
  timestamp    = {Sat, 13 Jul 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2406-04896.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2406-05993,
  author     = {Osa, Takayuki and
                Harada, Tatsuya},
  title      = {Discovering Multiple Solutions from a Single Task in Offline Reinforcement Learning},
  journal    = {CoRR},
  volume     = {abs/2406.05993},
  year       = {2024},
  url        = {https://doi.org/10.48550/arXiv.2406.05993},
  doi        = {10.48550/ARXIV.2406.05993},
  eprinttype = {arXiv},
  eprint     = {2406.05993},
  timestamp  = {Sat, 13 Jul 2024 01:00:00 +0200},
  biburl     = {https://dblp.org/rec/journals/corr/abs-2406-05993.bib},
  bibsource  = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ral/OsaOAH23,
  author       = {Takayuki Osa and
                  Naoto Osajima and
                  Masanori Aizawa and
                  Tatsuya Harada},
  title        = {Learning Adaptive Policies for Autonomous Excavation Under Various
                  Soil Conditions by Adversarial Domain Sampling},
  journal      = {{IEEE} Robotics and Automation Letters},
  volume       = {8},
  number       = {9},
  pages        = {5536--5543},
  year         = {2023},
  url          = {https://doi.org/10.1109/LRA.2023.3296933},
  doi          = {10.1109/LRA.2023.3296933},
  timestamp    = {Thu, 31 Aug 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ral/OsaOAH23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tmlr/OsaHDMY23,
  author       = {Takayuki Osa and
                  Akinobu Hayashi and
                  Pranav Deo and
                  Naoki Morihira and
                  Takahide Yoshiike},
  title        = {Offline Reinforcement Learning with Mixture of Deterministic Policies},
  journal      = {Transactions on Machine Learning Research},
  volume       = {2023},
  year         = {2023},
  url          = {https://openreview.net/forum?id=zkRCp4RmAF},
  timestamp    = {Thu, 01 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/tmlr/OsaHDMY23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/YoshimitsuOI23,
  author       = {Yuhei Yoshimitsu and
                  Takayuki Osa and
                  Shuhei Ikemoto},
  title        = {Forward/Inverse Kinematics Modeling for Tensegrity Manipulator Based
                  on Goal-Conditioned Variational Autoencoder},
  booktitle    = {{IEEE/RSJ} International Conference on Intelligent Robots and Systems,
                  {IROS} 2023, Detroit, MI, USA, October 1-5, 2023},
  pages        = {6668--6673},
  publisher    = {{IEEE}},
  year         = {2023},
  url          = {https://doi.org/10.1109/IROS55552.2023.10341525},
  doi          = {10.1109/IROS55552.2023.10341525},
  timestamp    = {Sun, 04 Aug 2024 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/YoshimitsuOI23.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/access/OsaA22,
  author    = {Osa, Takayuki and
               Aizawa, Masanori},
  title     = {Deep Reinforcement Learning With Adversarial Training for Automated Excavation Using Depth Images},
  journal   = {{IEEE} Access},
  volume    = {10},
  pages     = {4523--4535},
  year      = {2022},
  url       = {https://doi.org/10.1109/ACCESS.2022.3140781},
  doi       = {10.1109/ACCESS.2022.3140781},
  timestamp = {Tue, 08 Feb 2022 00:00:00 +0100},
  biburl    = {https://dblp.org/rec/journals/access/OsaA22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijrr/Osa22,
  author       = {Takayuki Osa},
  title        = {Motion planning by learning the solution manifold in trajectory optimization},
  journal      = {The International Journal of Robotics Research},
  volume       = {41},
  number       = {3},
  pages        = {281--311},
  year         = {2022},
  url          = {https://doi.org/10.1177/02783649211044405},
  doi          = {10.1177/02783649211044405},
  timestamp    = {Sun, 02 Oct 2022 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijrr/Osa22.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/nn/OsaTS22,
  author    = {Osa, Takayuki and
               Tangkaratt, Voot and
               Sugiyama, Masashi},
  title     = {Discovering diverse solutions in deep reinforcement learning by maximizing state-action-based mutual information},
  journal   = {Neural Networks},
  volume    = {152},
  pages     = {90--104},
  year      = {2022},
  url       = {https://doi.org/10.1016/j.neunet.2022.04.009},
  doi       = {10.1016/J.NEUNET.2022.04.009},
  timestamp = {Mon, 28 Aug 2023 01:00:00 +0200},
  biburl    = {https://dblp.org/rec/journals/nn/OsaTS22.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/acml/HiraokaITOOT21,
  author    = {Hiraoka, Takuya and
               Imagawa, Takahisa and
               Tangkaratt, Voot and
               Osa, Takayuki and
               Onishi, Takashi and
               Tsuruoka, Yoshimasa},
  editor    = {Balasubramanian, Vineeth N. and
               Tsang, Ivor W.},
  title     = {Meta-Model-Based Meta-Policy Optimization},
  booktitle = {Asian Conference on Machine Learning, {ACML} 2021, 17-19 November 2021, Virtual Event},
  series    = {Proceedings of Machine Learning Research},
  volume    = {157},
  pages     = {129--144},
  publisher = {{PMLR}},
  year      = {2021},
  url       = {https://proceedings.mlr.press/v157/hiraoka21a.html},
  timestamp = {Tue, 07 May 2024 20:11:56 +0200},
  biburl    = {https://dblp.org/rec/conf/acml/HiraokaITOOT21.bib},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2103-07084,
  author       = {Takayuki Osa and
                  Voot Tangkaratt and
                  Masashi Sugiyama},
  title        = {Discovering Diverse Solutions in Deep Reinforcement Learning},
  journal      = {CoRR},
  volume       = {abs/2103.07084},
  year         = {2021},
  url          = {https://arxiv.org/abs/2103.07084},
  eprinttype    = {arXiv},
  eprint       = {2103.07084},
  timestamp    = {Wed, 24 Mar 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2103-07084.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2107-05842,
  author       = {Takayuki Osa},
  title        = {Motion Planning by Learning the Solution Manifold in Trajectory Optimization},
  journal      = {CoRR},
  volume       = {abs/2107.05842},
  year         = {2021},
  url          = {https://arxiv.org/abs/2107.05842},
  eprinttype    = {arXiv},
  eprint       = {2107.05842},
  timestamp    = {Wed, 21 Jul 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2107-05842.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijrr/Osa20,
  author       = {Takayuki Osa},
  title        = {Multimodal trajectory optimization for motion planning},
  journal      = {Int. J. Robotics Res.},
  volume       = {39},
  number       = {8},
  year         = {2020},
  url          = {https://doi.org/10.1177/0278364920918296},
  doi          = {10.1177/0278364920918296},
  timestamp    = {Thu, 29 Apr 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijrr/Osa20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ral/KarasawaKOFNO20,
  author       = {Hiroyuki Karasawa and
                  Tomohiro Kanemaki and
                  Kei Oomae and
                  Rui Fukui and
                  Masayuki Nakao and
                  Takayuki Osa},
  title        = {Hierarchical Stochastic Optimization With Application to Parameter
                  Tuning for Electronically Controlled Transmissions},
  journal      = {{IEEE} Robotics Autom. Lett.},
  volume       = {5},
  number       = {2},
  pages        = {628--635},
  year         = {2020},
  url          = {https://doi.org/10.1109/LRA.2020.2965085},
  doi          = {10.1109/LRA.2020.2965085},
  timestamp    = {Fri, 22 May 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ral/KarasawaKOFNO20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/sncs/OsaI20,
  author       = {Takayuki Osa and
                  Shuhei Ikemoto},
  title        = {Goal-Conditioned Variational Autoencoder Trajectory Primitives with
                  Continuous and Discrete Latent Codes},
  journal      = {{SN} Comput. Sci.},
  volume       = {1},
  number       = {5},
  pages        = {303},
  year         = {2020},
  url          = {https://doi.org/10.1007/s42979-020-00324-7},
  doi          = {10.1007/S42979-020-00324-7},
  timestamp    = {Tue, 06 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/sncs/OsaI20.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2003-07054,
  author       = {Takayuki Osa},
  title        = {Multimodal Trajectory Optimization for Motion Planning},
  journal      = {CoRR},
  volume       = {abs/2003.07054},
  year         = {2020},
  url          = {https://arxiv.org/abs/2003.07054},
  eprinttype    = {arXiv},
  eprint       = {2003.07054},
  timestamp    = {Tue, 17 Mar 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2003-07054.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2006-02608,
  author       = {Takuya Hiraoka and
                  Takahisa Imagawa and
                  Voot Tangkaratt and
                  Takayuki Osa and
                  Takashi Onishi and
                  Yoshimasa Tsuruoka},
  title        = {Meta-Model-Based Meta-Policy Optimization},
  journal      = {CoRR},
  volume       = {abs/2006.02608},
  year         = {2020},
  url          = {https://arxiv.org/abs/2006.02608},
  eprinttype    = {arXiv},
  eprint       = {2006.02608},
  timestamp    = {Mon, 08 Jun 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2006-02608.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-2007-12397,
  author       = {Takayuki Osa},
  title        = {Learning the Solution Manifold in Optimization and Its Application
                  in Motion Planning},
  journal      = {CoRR},
  volume       = {abs/2007.12397},
  year         = {2020},
  url          = {https://arxiv.org/abs/2007.12397},
  eprinttype    = {arXiv},
  eprint       = {2007.12397},
  timestamp    = {Wed, 29 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-2007-12397.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iclr/OsaTS19,
  author       = {Takayuki Osa and
                  Voot Tangkaratt and
                  Masashi Sugiyama},
  title        = {Hierarchical Reinforcement Learning via Advantage-Weighted Information
                  Maximization},
  booktitle    = {7th International Conference on Learning Representations, {ICLR} 2019,
                  New Orleans, LA, USA, May 6-9, 2019},
  publisher    = {OpenReview.net},
  year         = {2019},
  url          = {https://openreview.net/forum?id=Hyl\_vjC5KQ},
  timestamp    = {Thu, 25 Jul 2019 13:03:15 +0200},
  biburl       = {https://dblp.org/rec/conf/iclr/OsaTS19.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1901-01365,
  author       = {Takayuki Osa and
                  Voot Tangkaratt and
                  Masashi Sugiyama},
  title        = {Hierarchical Reinforcement Learning via Advantage-Weighted Information
                  Maximization},
  journal      = {CoRR},
  volume       = {abs/1901.01365},
  year         = {2019},
  url          = {https://arxiv.org/abs/1901.01365},
  eprinttype    = {arXiv},
  eprint       = {1901.01365},
  timestamp    = {Thu, 31 Jan 2019 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1901-01365.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1910-01465,
  author       = {Johannes Ackermann and
                  Volker Gabler and
                  Takayuki Osa and
                  Masashi Sugiyama},
  title        = {Reducing Overestimation Bias in Multi-Agent Domains Using Double Centralized
                  Critics},
  journal      = {CoRR},
  volume       = {abs/1910.01465},
  year         = {2019},
  url          = {https://arxiv.org/abs/1910.01465},
  eprinttype    = {arXiv},
  eprint       = {1910.01465},
  timestamp    = {Fri, 04 Oct 2019 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1910-01465.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1912-04063,
  author       = {Takayuki Osa and
                  Shuhei Ikemoto},
  title        = {Variational Autoencoder Trajectory Primitives with Continuous and
                  Discrete Latent Codes},
  journal      = {CoRR},
  volume       = {abs/1912.04063},
  year         = {2019},
  url          = {https://arxiv.org/abs/1912.04063},
  eprinttype    = {arXiv},
  eprint       = {1912.04063},
  timestamp    = {Thu, 02 Jan 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1912-04063.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ar/OsaPN18,
  author       = {Takayuki Osa and
                  Jan Peters and
                  Gerhard Neumann},
  title        = {Hierarchical reinforcement learning of multiple grasping strategies
                  with human instructions},
  journal      = {Adv. Robotics},
  volume       = {32},
  number       = {18},
  pages        = {955--968},
  year         = {2018},
  url          = {https://doi.org/10.1080/01691864.2018.1509018},
  doi          = {10.1080/01691864.2018.1509018},
  timestamp    = {Sat, 25 Apr 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ar/OsaPN18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ftrob/OsaPNBA018,
  author       = {Takayuki Osa and
                  Joni Pajarinen and
                  Gerhard Neumann and
                  J. Andrew Bagnell and
                  Pieter Abbeel and
                  Jan Peters},
  title        = {An Algorithmic Perspective on Imitation Learning},
  journal      = {Found. Trends Robotics},
  volume       = {7},
  number       = {1-2},
  pages        = {1--179},
  year         = {2018},
  url          = {https://doi.org/10.1561/2300000053},
  doi          = {10.1561/2300000053},
  timestamp    = {Sun, 19 Jan 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ftrob/OsaPNBA018.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/tase/OsaSM18,
  author       = {Takayuki Osa and
                  Naohiko Sugita and
                  Mamoru Mitsuishi},
  title        = {Online Trajectory Planning and Force Control for Automation of Surgical
                  Tasks},
  journal      = {{IEEE} Trans. Autom. Sci. Eng.},
  volume       = {15},
  number       = {2},
  pages        = {675--691},
  year         = {2018},
  url          = {https://doi.org/10.1109/TASE.2017.2676018},
  doi          = {10.1109/TASE.2017.2676018},
  timestamp    = {Mon, 26 Oct 2020 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/tase/OsaSM18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/aaai/OsaS18,
  author       = {Takayuki Osa and
                  Masashi Sugiyama},
  editor       = {Sheila A. McIlraith and
                  Kilian Q. Weinberger},
  title        = {Hierarchical Policy Search via Return-Weighted Density Estimation},
  booktitle    = {Proceedings of the Thirty-Second {AAAI} Conference on Artificial Intelligence,
                  (AAAI-18), the 30th innovative Applications of Artificial Intelligence
                  (IAAI-18), and the 8th {AAAI} Symposium on Educational Advances in
                  Artificial Intelligence (EAAI-18), New Orleans, Louisiana, USA, February
                  2-7, 2018},
  pages        = {3860--3867},
  publisher    = {{AAAI} Press},
  year         = {2018},
  url          = {https://doi.org/10.1609/aaai.v32i1.11706},
  doi          = {10.1609/AAAI.V32I1.11706},
  timestamp    = {Sat, 21 Oct 2023 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/aaai/OsaS18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/PinslerAO0N18,
  author       = {Robert Pinsler and
                  Riad Akrour and
                  Takayuki Osa and
                  Jan Peters and
                  Gerhard Neumann},
  title        = {Sample and Feedback Efficient Hierarchical Reinforcement Learning
                  from Human Preferences},
  booktitle    = {2018 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2018, Brisbane, Australia, May 21-25, 2018},
  pages        = {596--601},
  publisher    = {{IEEE}},
  year         = {2018},
  url          = {https://doi.org/10.1109/ICRA.2018.8460907},
  doi          = {10.1109/ICRA.2018.8460907},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/PinslerAO0N18.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1811-06711,
  author       = {Takayuki Osa and
                  Joni Pajarinen and
                  Gerhard Neumann and
                  J. Andrew Bagnell and
                  Pieter Abbeel and
                  Jan Peters},
  title        = {An Algorithmic Perspective on Imitation Learning},
  journal      = {CoRR},
  volume       = {abs/1811.06711},
  year         = {2018},
  url          = {https://arxiv.org/abs/1811.06711},
  eprinttype    = {arXiv},
  eprint       = {1811.06711},
  timestamp    = {Sun, 25 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1811-06711.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ral/OsaESL0N17,
  author       = {Takayuki Osa and
                  Amir Masoud Ghalamzan Esfahani and
                  Rustam Stolkin and
                  Rudolf Lioutikov and
                  Jan Peters and
                  Gerhard Neumann},
  title        = {Guiding Trajectory Optimization by Demonstrated Distributions},
  journal      = {{IEEE} Robotics Autom. Lett.},
  volume       = {2},
  number       = {2},
  pages        = {819--826},
  year         = {2017},
  url          = {https://doi.org/10.1109/LRA.2017.2653850},
  doi          = {10.1109/LRA.2017.2653850},
  timestamp    = {Mon, 03 Mar 2025 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/journals/ral/OsaESL0N17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/corl/MaedaEOB017,
  author       = {Guilherme Maeda and
                  Marco Ewerton and
                  Takayuki Osa and
                  Baptiste Busch and
                  Jan Peters},
  title        = {Active Incremental Learning of Robot Movement Primitives},
  booktitle    = {1st Annual Conference on Robot Learning, CoRL 2017, Mountain View,
                  California, USA, November 13-15, 2017, Proceedings},
  series       = {Proceedings of Machine Learning Research},
  volume       = {78},
  pages        = {37--46},
  publisher    = {{PMLR}},
  year         = {2017},
  url          = {https://proceedings.mlr.press/v78/maeda17a.html},
  timestamp    = {Wed, 03 Apr 2019 18:17:24 +0200},
  biburl       = {https://dblp.org/rec/conf/corl/MaedaEOB017.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/Abi-FarrajOPPNG17,
  author       = {Firas Abi{-}Farraj and
                  Takayuki Osa and
                  Nicolo Pedemonte and
                  Jan Peters and
                  Gerhard Neumann and
                  Paolo Robuffo Giordano},
  title        = {A learning-based shared control architecture for interactive task
                  execution},
  booktitle    = {2017 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2017, Singapore, Singapore, May 29 - June 3, 2017},
  pages        = {329--335},
  publisher    = {{IEEE}},
  year         = {2017},
  url          = {https://doi.org/10.1109/ICRA.2017.7989042},
  doi          = {10.1109/ICRA.2017.7989042},
  timestamp    = {Wed, 16 Oct 2019 14:14:51 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/Abi-FarrajOPPNG17.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/corr/abs-1711-10173,
  author       = {Takayuki Osa and
                  Masashi Sugiyama},
  title        = {Hierarchical Policy Search via Return-Weighted Density Estimation},
  journal      = {CoRR},
  volume       = {abs/1711.10173},
  year         = {2017},
  url          = {https://arxiv.org/abs/1711.10173},
  eprinttype    = {arXiv},
  eprint       = {1711.10173},
  timestamp    = {Mon, 13 Aug 2018 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/corr/abs-1711-10173.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iser/Osa0N16,
  author       = {Takayuki Osa and
                  Jan Peters and
                  Gerhard Neumann},
  editor       = {Dana Kulic and
                  Yoshihiko Nakamura and
                  Oussama Khatib and
                  Gentiane Venture},
  title        = {Experiments with Hierarchical Reinforcement Learning of Multiple Grasping
                  Policies},
  booktitle    = {International Symposium on Experimental Robotics, {ISER} 2016, Tokyo,
                  Japan, October 3-6, 2016},
  series       = {Springer Proceedings in Advanced Robotics},
  volume       = {1},
  pages        = {160--172},
  publisher    = {Springer},
  year         = {2016},
  url          = {https://doi.org/10.1007/978-3-319-50115-4\_15},
  doi          = {10.1007/978-3-319-50115-4\_15},
  timestamp    = {Fri, 02 Nov 2018 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/iser/Osa0N16.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/OsaASCSIMTTM14,
  author       = {Takayuki Osa and
                  Christian Farid Abawi and
                  Naohiko Sugita and
                  Hirotaka Chikuda and
                  Shurei Sugita and
                  Hideya Ito and
                  Toru Moro and
                  Yoshio Takatori and
                  Sakae Tanaka and
                  Mamoru Mitsuishi},
  title        = {Autonomous penetration detection for bone cutting tool using demonstration-based
                  learning},
  booktitle    = {2014 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2014, Hong Kong, China, May 31 - June 7, 2014},
  pages        = {290--296},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/ICRA.2014.6906624},
  doi          = {10.1109/ICRA.2014.6906624},
  timestamp    = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/OsaASCSIMTTM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/OsaHSM14,
  author       = {Takayuki Osa and
                  Kanako Harada and
                  Naohiko Sugita and
                  Mamoru Mitsuishi},
  title        = {Trajectory planning under different initial conditions for surgical
                  task automation by learning from demonstration},
  booktitle    = {2014 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2014, Hong Kong, China, May 31 - June 7, 2014},
  pages        = {6507--6513},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/ICRA.2014.6907819},
  doi          = {10.1109/ICRA.2014.6907819},
  timestamp    = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/OsaHSM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/OsaUSM14,
  author       = {Takayuki Osa and
                  Satoshi Uchida and
                  Naohiko Sugita and
                  Mamoru Mitsuishi},
  title        = {Hybrid control of master-slave velocity control and admittance control
                  for safe remote surgery},
  booktitle    = {2014 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2014, Chicago, IL, USA, September 14-18, 2014},
  pages        = {1328--1334},
  publisher    = {{IEEE}},
  year         = {2014},
  url          = {https://doi.org/10.1109/IROS.2014.6942729},
  doi          = {10.1109/IROS.2014.6942729},
  timestamp    = {Tue, 05 Sep 2023 15:07:47 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/OsaUSM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/rss/OsaSM14,
  author       = {Takayuki Osa and
                  Naohiko Sugita and
                  Mamoru Mitsuishi},
  editor       = {Dieter Fox and
                  Lydia E. Kavraki and
                  Hanna Kurniawati},
  title        = {Online Trajectory Planning in Dynamic Environments for Surgical Task
                  Automation},
  booktitle    = {Robotics: Science and Systems X, University of California, Berkeley,
                  USA, July 12-16, 2014},
  year         = {2014},
  url          = {http://www.roboticsproceedings.org/rss10/p11.html},
  doi          = {10.15607/RSS.2014.X.011},
  timestamp    = {Fri, 29 Jan 2021 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/rss/OsaSM14.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/OsaHHSM13,
  author       = {Takayuki Osa and
                  Takuto Haniu and
                  Kanako Harada and
                  Naohiko Sugita and
                  Mamoru Mitsuishi},
  title        = {Perforation risk detector using demonstration-based learning for teleoperated
                  robotic surgery},
  booktitle    = {2013 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, {IROS} 2013, Tokyo, Japan, November 3-7, 2013},
  pages        = {2572--2577},
  publisher    = {{IEEE}},
  year         = {2013},
  url          = {https://doi.org/10.1109/IROS.2013.6696719},
  doi          = {10.1109/IROS.2013.6696719},
  timestamp    = {Tue, 05 Sep 2023 15:06:24 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/OsaHHSM13.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icas/StaubKOB10,
  author       = {Christoph Staub and
                  Alois C. Knoll and
                  Takayuki Osa and
                  Robert Bauernschmitt},
  title        = {Autonomous High Precision Positioning of Surgical Instruments in Robot-Assisted
                  Minimally Invasive Surgery under Visual Guidance},
  booktitle    = {Sixth International Conference on Autonomic and Autonomous Systems,
                  {ICAS} 2010, Cancun, Mexico, March 7-13, 2010},
  pages        = {64--69},
  publisher    = {{IEEE} Computer Society},
  year         = {2010},
  url          = {https://doi.org/10.1109/ICAS.2010.18},
  doi          = {10.1109/ICAS.2010.18},
  timestamp    = {Thu, 23 Mar 2023 00:00:00 +0100},
  biburl       = {https://dblp.org/rec/conf/icas/StaubKOB10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/StaubOKB10,
  author       = {Christoph Staub and
                  Takayuki Osa and
                  Alois C. Knoll and
                  Robert Bauernschmitt},
  title        = {Automation of tissue piercing using circular needles and vision guidance
                  for computer aided laparoscopic surgery},
  booktitle    = {{IEEE} International Conference on Robotics and Automation, {ICRA}
                  2010, Anchorage, Alaska, USA, 3-7 May 2010},
  pages        = {4585--4590},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/ROBOT.2010.5509601},
  doi          = {10.1109/ROBOT.2010.5509601},
  timestamp    = {Wed, 19 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/StaubOKB10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/OndaOSHM10,
  author       = {Kazushi Onda and
                  Takayuki Osa and
                  Naohiko Sugita and
                  Makoto Hashizume and
                  Mamoru Mitsuishi},
  title        = {Asynchronous force and visual feedback in teleoperative laparoscopic
                  surgical system},
  booktitle    = {2010 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, October 18-22, 2010, Taipei, Taiwan},
  pages        = {844--849},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/IROS.2010.5650727},
  doi          = {10.1109/IROS.2010.5650727},
  timestamp    = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/OndaOSHM10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/iros/OsaSK10,
  author       = {Takayuki Osa and
                  Christoph Staub and
                  Alois C. Knoll},
  title        = {Framework of automatic robot surgery system using Visual servoing},
  booktitle    = {2010 {IEEE/RSJ} International Conference on Intelligent Robots and
                  Systems, October 18-22, 2010, Taipei, Taiwan},
  pages        = {1837--1842},
  publisher    = {{IEEE}},
  year         = {2010},
  url          = {https://doi.org/10.1109/IROS.2010.5650301},
  doi          = {10.1109/IROS.2010.5650301},
  timestamp    = {Wed, 19 May 2021 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/iros/OsaSK10.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@article{DBLP:journals/ijat/SugitaNONFAOSM09,
  author       = {Naohiko Sugita and
                  Taiga Nakano and
                  Takayuki Osa and
                  Yoshikazu Nakajima and
                  Kazuo Fujiwara and
                  Nobuhiro Abe and
                  Toshifumi Ozaki and
                  Masahiko Suzuki and
                  Mamoru Mitsuishi},
  title        = {Cutting Tool Protects for Soft Tissues in Bone-Milling Machining},
  journal      = {Int. J. Autom. Technol.},
  volume       = {3},
  number       = {2},
  pages        = {185--192},
  year         = {2009},
  url          = {https://doi.org/10.20965/ijat.2009.p0185},
  doi          = {10.20965/IJAT.2009.P0185},
  timestamp    = {Thu, 09 Jul 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/journals/ijat/SugitaNONFAOSM09.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}
@inproceedings{DBLP:conf/icra/SugitaONM08,
  author       = {Naohiko Sugita and
                  Takayuki Osa and
                  Yoshikazu Nakajima and
                  Mamoru Mitsuishi},
  title        = {Deformation analysis and active compensation of surgical milling robot
                  based on system error evaluation},
  booktitle    = {2008 {IEEE} International Conference on Robotics and Automation, {ICRA}
                  2008, May 19-23, 2008, Pasadena, California, {USA}},
  pages        = {3389--3394},
  publisher    = {{IEEE}},
  year         = {2008},
  url          = {https://doi.org/10.1109/ROBOT.2008.4543728},
  doi          = {10.1109/ROBOT.2008.4543728},
  timestamp    = {Sun, 25 Oct 2020 01:00:00 +0200},
  biburl       = {https://dblp.org/rec/conf/icra/SugitaONM08.bib},
  bibsource    = {dblp computer science bibliography, https://dblp.org}
}