% Encoding: UTF-8
%
% Bibliography database maintained with JabRef (classic BibTeX mode).
% Conventions used in this file:
%   - one field per line, values delimited by braces;
%   - months use the predefined three-letter macros (jan ... dec), unquoted;
%   - LaTeX special characters in text fields are escaped (e.g. \&);
%   - words that must keep their capitalisation are brace-protected.
% The fields "owner" and "timestamp" are JabRef bookkeeping and are not
% printed by standard bibliography styles.

@Misc{RoboSkate,
  author    = {Sakalauskas, Matas},
  month     = oct,
  title     = {{RoboSkate}},
  year      = {2020},
  owner     = {STEAM},
  timestamp = {2021-08-30},
  url       = {https://store.steampowered.com/app/1404530/RoboSkate/},
}

@Misc{unityRL,
  author    = {Juliani, Arthur and Berges, Vincent-Pierre and Teng, Ervin and Cohen, Andrew and Harper, Jonathan and Elion, Chris and Goy, Chris and Gao, Yuan and Henry, Hunter and Mattar, Marwan and Lange, Danny},
  title     = {{Unity: A General Platform for Intelligent Agents}},
  year      = {2020},
  journal   = {arXiv preprint arXiv:1809.02627},
  timestamp = {2021-08-30},
  url       = {https://github.com/Unity-Technologies/ml-agents},
}

@Manual{unityHeadless,
  title     = {{Unity Manual}},
  month     = aug,
  year      = {2021},
  owner     = {Unity},
  timestamp = {2021-08-30},
  url       = {https://docs.unity3d.com/Manual/CommandLineArguments.html},
}

@Article{unitywithoutMonitor,
  author    = {Zioma, Renaldas},
  journal   = {Towards Data Science},
  title     = {{How to run Unity on Amazon Cloud or without Monitor}},
  year      = {2017},
  month     = aug,
  owner     = {Renaldas Zioma},
  timestamp = {2021-08-30},
  url       = {https://towardsdatascience.com/how-to-run-unity-on-amazon-cloud-or-without-monitor-3c10ce022639},
}

@Misc{nvidiagpucontainersruntime,
  title     = {{NVIDIA} container runtime},
  timestamp = {2021-08-30},
  url       = {https://github.com/NVIDIA/nvidia-container-runtime},
}

@Manual{ServerGUI,
  title  = {{ServerGUI}},
  author = {McBurnett, Neal},
  month  = sep,
  year   = {2012},
  url    = {https://help.ubuntu.com/community/ServerGUI},
}

@Misc{nvidiavulkan,
  title     = {nvidia/vulkan},
  owner     = {NVIDIA},
  timestamp = {2021-08-30},
  url       = {https://hub.docker.com/r/nvidia/vulkan},
}

@Misc{SB3,
  author    = {Raffin, Antonin and Hill, Ashley and Ernestus, Maximilian and Gleave, Adam and Kanervisto, Anssi and Dormann, Noah},
  month     = may,
  title     = {{Stable Baselines3}},
  year      = {2020},
  timestamp = {2021-08-30},
  url       = {https://github.com/DLR-RM/stable-baselines3},
}

@Misc{imitation,
  author    = {Wang, Steven and Toyer, Sam and Gleave, Adam and Emmons, Scott},
  title     = {The {\texttt{imitation}} Library for Imitation Learning and Inverse Reinforcement Learning},
  year      = {2020},
  journal   = {GitHub repository},
  publisher = {GitHub},
  url       = {https://github.com/HumanCompatibleAI/imitation},
}

@Article{badrinarayanan2016segnet,
  author    = {Badrinarayanan, Vijay and Kendall, Alex and Cipolla, Roberto},
  journal   = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  title     = {{SegNet}: A deep convolutional encoder-decoder architecture for image segmentation},
  year      = {2017},
  number    = {12},
  pages     = {2481--2495},
  volume    = {39},
  publisher = {IEEE},
}

@Misc{Playthrough,
  author    = {Sakalauskas, Matas},
  month     = oct,
  title     = {{RoboSkate Developer Playthrough}},
  year      = {2020},
  timestamp = {2021-08-30},
  url       = {https://www.youtube.com/watch?v=_BWT11ttgJ4&t=117s&ab_channel=MatasSakalauskas},
}

@InBook{Watershed,
  author    = {Preim, Bernhard and Botha, Charl P.},
  chapter   = {4.3.5 Watershed Segmentation},
  pages     = {129--131},
  publisher = {Newnes},
  title     = {Visual computing for medicine: theory, algorithms, and applications},
  year      = {2013},
  url       = {https://www.sciencedirect.com/topics/computer-science/watershed-segmentation},
}

@Article{Watershed2,
  author    = {Zivkovic, Strahinja},
  journal   = {Data Hacker},
  title     = {{OpenCV projects -- Image segmentation with Watershed algorithm}},
  year      = {2020},
  month     = dec,
  timestamp = {2021-08-30},
  url       = {http://datahacker.rs/007-opencv-projects-image-segmentation-with-watershed-algorithm/},
}

@Article{ImageProcessing,
  author    = {Canuma, Prince},
  journal   = {Medium},
  title     = {{Image Pre-processing}},
  year      = {2018},
  month     = oct,
  timestamp = {2021-08-30},
  url       = {https://prince-canuma.medium.com/image-pre-processing-c1aec0be3edf},
}

@Manual{Canny,
  title     = {Canny edge detector},
  timestamp = {2021-08-30},
  url       = {https://scikit-image.org/docs/dev/auto_examples/edges/plot_canny.html},
}

@Article{Curse_of_Dimensionality,
  author    = {Bellman, Richard},
  journal   = {Science},
  title     = {Dynamic programming},
  year      = {1966},
  number    = {3731},
  pages     = {34--37},
  volume    = {153},
  publisher = {American Association for the Advancement of Science},
}

@Book{sutton2018reinforcement,
  author    = {Sutton, Richard S. and Barto, Andrew G.},
  publisher = {MIT Press},
  title     = {Reinforcement learning: An introduction},
  year      = {2018},
}

@Article{schulman2017proximal,
  author  = {Schulman, John and Wolski, Filip and Dhariwal, Prafulla and Radford, Alec and Klimov, Oleg},
  journal = {arXiv preprint arXiv:1707.06347},
  title   = {Proximal policy optimization algorithms},
  year    = {2017},
}

@Manual{NRP,
  title = {{Neurorobotics Platform}},
  url   = {https://neurorobotics.net/Documentation/nrp/index.html},
}

@Article{wang2019boosting,
  author  = {Wang, Che and Ross, Keith},
  journal = {arXiv preprint arXiv:1906.04009},
  title   = {Boosting soft actor-critic: Emphasizing recent experience without forgetting the past},
  year    = {2019},
}

@InProceedings{zhou2019continuity,
  author    = {Zhou, Yi and Barnes, Connelly and Lu, Jingwan and Yang, Jimei and Li, Hao},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  title     = {On the continuity of rotation representations in neural networks},
  year      = {2019},
  pages     = {5745--5753},
}

@Article{Saha2018,
  author    = {Saha, Sumit},
  journal   = {Towards Data Science},
  title     = {{A Comprehensive Guide to Convolutional Neural Networks --- the ELI5 way}},
  year      = {2018},
  month     = dec,
  timestamp = {2021-08-30},
  url       = {https://towardsdatascience.com/a-comprehensive-guide-to-convolutional-neural-networks-the-eli5-way-3bd2b1164a53},
}

@Article{Daaboul2020,
  author  = {Daaboul, Karam},
  journal = {Medium},
  title   = {{Reinforcement Learning: Dealing with Sparse Reward Environments}},
  year    = {2020},
  month   = aug,
  url     = {https://medium.com/@m.k.daaboul/dealing-with-sparse-reward-environments-38c0489c844d},
}

@Article{Bonsai2017,
  author  = {{Bonsai}},
  journal = {Medium},
  title   = {{Deep Reinforcement Learning Models: Tips \& Tricks for Writing Reward Functions}},
  year    = {2017},
  month   = nov,
  url     = {https://medium.com/@BonsaiAI/deep-reinforcement-learning-models-tips-tricks-for-writing-reward-functions-a84fe525e8e0},
}

@Article{gudimella2017deep,
  author  = {Gudimella, Aditya and Story, Ross and Shaker, Matineh and Kong, Ruofan and Brown, Matthew and Shnayder, Victor and Campos, Marcos},
  journal = {arXiv preprint arXiv:1709.06977},
  title   = {Deep reinforcement learning for dexterous manipulation with concept networks},
  year    = {2017},
}

@Article{Raffin2019,
  author  = {Raffin, Antonin},
  journal = {Towards Data Science},
  title   = {{Learning to Drive Smoothly in Minutes}},
  year    = {2019},
  month   = jan,
}

@InProceedings{mnih2016asynchronous,
  author       = {Mnih, Volodymyr and Badia, Adria Puigdomenech and Mirza, Mehdi and Graves, Alex and Lillicrap, Timothy and Harley, Tim and Silver, David and Kavukcuoglu, Koray},
  booktitle    = {International Conference on Machine Learning},
  title        = {Asynchronous methods for deep reinforcement learning},
  year         = {2016},
  organization = {PMLR},
  pages        = {1928--1937},
}

@Article{haarnoja2018soft,
  author  = {Haarnoja, Tuomas and Zhou, Aurick and Hartikainen, Kristian and Tucker, George and Ha, Sehoon and Tan, Jie and Kumar, Vikash and Zhu, Henry and Gupta, Abhishek and Abbeel, Pieter and others},
  journal = {arXiv preprint arXiv:1812.05905},
  title   = {Soft actor-critic algorithms and applications},
  year    = {2018},
}

@Article{mnih2013playing,
  author  = {Mnih, Volodymyr and Kavukcuoglu, Koray and Silver, David and Graves, Alex and Antonoglou, Ioannis and Wierstra, Daan and Riedmiller, Martin},
  journal = {arXiv preprint arXiv:1312.5602},
  title   = {Playing {Atari} with deep reinforcement learning},
  year    = {2013},
}

@Article{fu2017learning,
  author  = {Fu, Justin and Luo, Katie and Levine, Sergey},
  journal = {arXiv preprint arXiv:1710.11248},
  title   = {Learning robust rewards with adversarial inverse reinforcement learning},
  year    = {2017},
}

@Article{ho2016generative,
  author  = {Ho, Jonathan and Ermon, Stefano},
  journal = {Advances in Neural Information Processing Systems},
  title   = {Generative adversarial imitation learning},
  year    = {2016},
  pages   = {4565--4573},
  volume  = {29},
}

@Comment{jabref-meta: databaseType:bibtex;}