% Secondary publication (Zweitveroeffentlichung) in the University of Potsdam
% series. The series title is kept in `series` only; the exported `journal`
% copy was dropped because this item is not a journal article.
% NOTE(review): `pages` holds a single number, presumably the page count.
@misc{PanzerBenderGronau2022,
  author    = {Panzer, Marcel and Bender, Benedict and Gronau, Norbert},
  title     = {Neural agent-based production planning and control},
  series    = {Zweitver{\"o}ffentlichungen der Universit{\"a}t Potsdam : Wirtschafts- und Sozialwissenschaftliche Reihe},
  issn      = {1867-5808},
  doi       = {10.25932/publishup-60477},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-604777},
  pages     = {26},
  year      = {2022},
  abstract  = {Nowadays, production planning and control must cope with mass customization, increased fluctuations in demand, and high competition pressures. Despite prevailing market risks, planning accuracy and increased adaptability in the event of disruptions or failures must be ensured, while simultaneously optimizing key process indicators. To manage that complex task, neural networks that can process large quantities of high-dimensional data in real time have been widely adopted in recent years. Although these are already extensively deployed in production systems, a systematic review of applications and implemented agent embeddings and architectures has not yet been conducted. The main contribution of this paper is to provide researchers and practitioners with an overview of applications and applied embeddings and to motivate further research in neural agent-based production. Findings indicate that neural agents are not only deployed in diverse applications, but are also increasingly implemented in multi-agent environments or in combination with conventional methods --- leveraging performances compared to benchmarks and reducing dependence on human experience. This not only implies a more sophisticated focus on distributed production resources, but also broadening the perspective from a local to a global scale. Nevertheless, future research must further increase scalability and reproducibility to guarantee a simplified transfer of results to reality.},
  language  = {en}
}
% Journal version (Journal of Manufacturing Systems, vol. 65).
% The key carries an `a` suffix because the unsuffixed key is already used by
% an earlier entry in this file; a repeated key makes the later entry
% unreachable. The `series` copy of the journal title was removed.
@article{PanzerBenderGronau2022a,
  author    = {Panzer, Marcel and Bender, Benedict and Gronau, Norbert},
  title     = {Neural agent-based production planning and control},
  journal   = {Journal of Manufacturing Systems},
  volume    = {65},
  publisher = {Elsevier},
  address   = {Amsterdam},
  issn      = {0278-6125},
  doi       = {10.1016/j.jmsy.2022.10.019},
  pages     = {743--766},
  year      = {2022},
  abstract  = {Nowadays, production planning and control must cope with mass customization, increased fluctuations in demand, and high competition pressures. Despite prevailing market risks, planning accuracy and increased adaptability in the event of disruptions or failures must be ensured, while simultaneously optimizing key process indicators. To manage that complex task, neural networks that can process large quantities of high-dimensional data in real time have been widely adopted in recent years. Although these are already extensively deployed in production systems, a systematic review of applications and implemented agent embeddings and architectures has not yet been conducted. The main contribution of this paper is to provide researchers and practitioners with an overview of applications and applied embeddings and to motivate further research in neural agent-based production. Findings indicate that neural agents are not only deployed in diverse applications, but are also increasingly implemented in multi-agent environments or in combination with conventional methods --- leveraging performances compared to benchmarks and reducing dependence on human experience. This not only implies a more sophisticated focus on distributed production resources, but also broadening the perspective from a local to a global scale. Nevertheless, future research must further increase scalability and reproducibility to guarantee a simplified transfer of results to reality.},
  language  = {en}
}
% Magazine article (issue 3 of Factory Innovation, pp. 8--11), typed as an
% article so that the journal, number and pages fields are actually rendered.
% The award name in the title is brace-protected against sentence-casing styles.
@article{Panzer2023,
  author    = {Panzer, Marcel},
  title     = {Factory {Innovation} {Award}},
  journal   = {Factory Innovation : agil und smart mit Industrie 4.0},
  number    = {3},
  publisher = {GITO mbH - Verlag f{\"u}r Industrielle Informationstechnik und Organisation},
  address   = {Berlin},
  issn      = {2749-7593},
  pages     = {8--11},
  year      = {2023},
  abstract  = {Einmal mehr brachte die Hannover Messe die Spitzen der Industrie zusammen, um die wegweisenden Innovationen des Jahres mit dem begehrten Factory Innovation Award 2023 zu ehren. Dieser renommierte Preis, der erstmals auf der Industrial Transformation Stage verliehen wurde, markierte den H{\"o}hepunkt einer spannungsgeladenen Veranstaltung.},
  language  = {de}
}
% Journal article in Procedia CIRP, vol. 121. The `series` copy of the journal
% title was removed and the page range uses the plain `--` form.
@article{PanzerGronau2024,
  author    = {Panzer, Marcel and Gronau, Norbert},
  title     = {Enhancing economic efficiency in modular production systems through deep reinforcement learning},
  journal   = {Procedia CIRP},
  volume    = {121},
  publisher = {Elsevier},
  address   = {Amsterdam},
  issn      = {2212-8271},
  doi       = {10.1016/j.procir.2023.09.229},
  pages     = {55--60},
  year      = {2024},
  abstract  = {In times of increasingly complex production processes and volatile customer demands, the production adaptability is crucial for a company's profitability and competitiveness. The ability to cope with rapidly changing customer requirements and unexpected internal and external events guarantees robust and efficient production processes, requiring a dedicated control concept at the shop floor level. Yet in today's practice, conventional control approaches remain in use, which may not keep up with the dynamic behaviour due to their scenario-specific and rigid properties. To address this challenge, deep learning methods were increasingly deployed due to their optimization and scalability properties. However, these approaches were often tested in specific operational applications and focused on technical performance indicators such as order tardiness or total throughput. In this paper, we propose a deep reinforcement learning based production control to optimize combined techno-financial performance measures. Based on pre-defined manufacturing modules that are supplied and operated by multiple agents, positive effects were observed in terms of increased revenue and reduced penalties due to lower throughput times and fewer delayed products. The combined modular and multi-staged approach as well as the distributed decision-making further leverage scalability and transferability to other scenarios.},
  language  = {en}
}
% Doctoral thesis, Universitaet Potsdam. The abstract has two paragraphs;
% line-break hyphenation artifacts from text extraction were repaired.
@phdthesis{Panzer2024,
  author    = {Panzer, Marcel},
  title     = {Design of a hyper-heuristics based control framework for modular production systems},
  doi       = {10.25932/publishup-63300},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-633006},
  school    = {Universit{\"a}t Potsdam},
  pages     = {vi, 334},
  year      = {2024},
  abstract  = {Volatile supply and sales markets, coupled with increasing product individualization and complex production processes, present significant challenges for manufacturing companies. These must navigate and adapt to ever-shifting external and internal factors while ensuring robustness against process variabilities and unforeseen events. This has a pronounced impact on production control, which serves as the operational intersection between production planning and the shop-floor resources, and necessitates the capability to manage intricate process interdependencies effectively. Considering the increasing dynamics and product diversification, alongside the need to maintain constant production performances, the implementation of innovative control strategies becomes crucial. In recent years, the integration of Industry 4.0 technologies and machine learning methods has gained prominence in addressing emerging challenges in production applications. Within this context, this cumulative thesis analyzes deep learning based production systems based on five publications. Particular attention is paid to the applications of deep reinforcement learning, aiming to explore its potential in dynamic control contexts. Analysis reveal that deep reinforcement learning excels in various applications, especially in dynamic production control tasks. Its efficacy can be attributed to its interactive learning and real-time operational model. However, despite its evident utility, there are notable structural, organizational, and algorithmic gaps in the prevailing research. A predominant portion of deep reinforcement learning based approaches is limited to specific job shop scenarios and often overlooks the potential synergies in combined resources. Furthermore, it highlights the rare implementation of multi-agent systems and semi-heterarchical systems in practical settings. A notable gap remains in the integration of deep reinforcement learning into a hyper-heuristic.
To bridge these research gaps, this thesis introduces a deep reinforcement learning based hyper-heuristic for the control of modular production systems, developed in accordance with the design science research methodology. Implemented within a semi-heterarchical multi-agent framework, this approach achieves a threefold reduction in control and optimisation complexity while ensuring high scalability, adaptability, and robustness of the system. In comparative benchmarks, this control methodology outperforms rule-based heuristics, reducing throughput times and tardiness, and effectively incorporates customer and order-centric metrics. The control artifact facilitates a rapid scenario generation, motivating for further research efforts and bridging the gap to real-world applications. The overarching goal is to foster a synergy between theoretical insights and practical solutions, thereby enriching scientific discourse and addressing current industrial challenges.},
  language  = {en}
}
% Journal article in the International Journal of Production Research.
% The export had volume and number swapped (13 / 60); they are stored here as
% volume 60, issue 13. NOTE(review): confirm against the publisher record for
% the DOI, and add the page range, which the export did not include.
@article{PanzerBender2021,
  author    = {Panzer, Marcel and Bender, Benedict},
  title     = {Deep reinforcement learning in production systems},
  journal   = {International Journal of Production Research},
  volume    = {60},
  number    = {13},
  publisher = {Taylor \& Francis},
  address   = {London},
  issn      = {1366-588X},
  doi       = {10.1080/00207543.2021.1973138},
  year      = {2021},
  abstract  = {Shortening product development cycles and fully customizable products pose major challenges for production systems. These not only have to cope with an increased product diversity but also enable high throughputs and provide a high adaptability and robustness to process variations and unforeseen incidents. To overcome these challenges, deep Reinforcement Learning (RL) has been increasingly applied for the optimization of production systems. Unlike other machine learning methods, deep RL operates on recently collected sensor-data in direct interaction with its environment and enables real-time responses to system changes. Although deep RL is already being deployed in production systems, a systematic review of the results has not yet been established. The main contribution of this paper is to provide researchers and practitioners an overview of applications and to motivate further implementations and research of deep RL supported production systems. Findings reveal that deep RL is applied in a variety of production domains, contributing to data-driven and flexible processes. In most applications, conventional methods were outperformed and implementation efforts or dependence on human experience were reduced. Nevertheless, future research must focus more on transferring the findings to real-world systems to analyze safety aspects and demonstrate reliability under prevailing conditions.},
  language  = {en}
}
% Secondary publication (Zweitveroeffentlichung) in the University of Potsdam
% series. The series title is kept in `series` only; the exported `journal`
% copy was dropped because this item is not a journal article.
% NOTE(review): the ISSN differs from the one on the other entries of this
% series in the file (1867-5808) -- verify which one belongs here.
% NOTE(review): `pages` holds a single number, presumably the page count.
@misc{PanzerBenderGronau2021,
  author    = {Panzer, Marcel and Bender, Benedict and Gronau, Norbert},
  title     = {Deep reinforcement learning in production planning and control},
  series    = {Zweitver{\"o}ffentlichungen der Universit{\"a}t Potsdam : Wirtschafts- und Sozialwissenschaftliche Reihe},
  issn      = {2701-6277},
  doi       = {10.25932/publishup-60572},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-605722},
  pages     = {13},
  year      = {2021},
  abstract  = {Increasingly fast development cycles and individualized products pose major challenges for today's smart production systems in times of industry 4.0. The systems must be flexible and continuously adapt to changing conditions while still guaranteeing high throughputs and robustness against external disruptions. Deep reinforcement learning (RL) algorithms, which already reached impressive success with Google DeepMind's AlphaGo, are increasingly transferred to production systems to meet related requirements. Unlike supervised and unsupervised machine learning techniques, deep RL algorithms learn based on recently collected sensor- and process-data in direct interaction with the environment and are able to perform decisions in real-time. As such, deep RL algorithms seem promising given their potential to provide decision support in complex environments, as production systems, and simultaneously adapt to changing circumstances. While different use-cases for deep RL emerged, a structured overview and integration of findings on their application are missing. To address this gap, this contribution provides a systematic literature review of existing deep RL applications in the field of production planning and control as well as production logistics. From a performance perspective, it became evident that deep RL can beat heuristics significantly in their overall performance and provides superior solutions to various industrial use-cases. Nevertheless, safety and reliability concerns must be overcome before the widespread use of deep RL is possible which presumes more intensive testing of deep RL in real world applications besides the already ongoing intensive simulations.},
  language  = {en}
}
% Conference paper in the Proceedings of the Conference on Production Systems
% and Logistics. The key carries an `a` suffix because the unsuffixed key is
% already used by an earlier entry in this file; a repeated key makes the later
% entry unreachable. The `series` copy of the proceedings title was removed.
@inproceedings{PanzerBenderGronau2021a,
  author    = {Panzer, Marcel and Bender, Benedict and Gronau, Norbert},
  title     = {Deep reinforcement learning in production planning and control},
  booktitle = {Proceedings of the Conference on Production Systems and Logistics},
  publisher = {publish-Ing.},
  address   = {Hannover},
  issn      = {2701-6277},
  doi       = {10.15488/11238},
  pages     = {535--545},
  year      = {2021},
  abstract  = {Increasingly fast development cycles and individualized products pose major challenges for today's smart production systems in times of industry 4.0. The systems must be flexible and continuously adapt to changing conditions while still guaranteeing high throughputs and robustness against external disruptions. Deep reinforcement learning (RL) algorithms, which already reached impressive success with Google DeepMind's AlphaGo, are increasingly transferred to production systems to meet related requirements. Unlike supervised and unsupervised machine learning techniques, deep RL algorithms learn based on recently collected sensor- and process-data in direct interaction with the environment and are able to perform decisions in real-time. As such, deep RL algorithms seem promising given their potential to provide decision support in complex environments, as production systems, and simultaneously adapt to changing circumstances. While different use-cases for deep RL emerged, a structured overview and integration of findings on their application are missing. To address this gap, this contribution provides a systematic literature review of existing deep RL applications in the field of production planning and control as well as production logistics. From a performance perspective, it became evident that deep RL can beat heuristics significantly in their overall performance and provides superior solutions to various industrial use-cases. Nevertheless, safety and reliability concerns must be overcome before the widespread use of deep RL is possible which presumes more intensive testing of deep RL in real world applications besides the already ongoing intensive simulations.},
  language  = {en}
}
% Secondary publication (Zweitveroeffentlichung) in the University of Potsdam
% series. The series title is kept in `series` only; the exported `journal`
% copy was dropped because this item is not a journal article.
% NOTE(review): `pages` holds a single number, presumably the page count.
@misc{PanzerBenderGronau2023,
  author    = {Panzer, Marcel and Bender, Benedict and Gronau, Norbert},
  title     = {A deep reinforcement learning based hyper-heuristic for modular production control},
  series    = {Zweitver{\"o}ffentlichungen der Universit{\"a}t Potsdam : Wirtschafts- und Sozialwissenschaftliche Reihe},
  issn      = {1867-5808},
  doi       = {10.25932/publishup-60564},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-605642},
  pages     = {24},
  year      = {2023},
  abstract  = {In nowadays production, fluctuations in demand, shortening product life-cycles, and highly configurable products require an adaptive and robust control approach to maintain competitiveness. This approach must not only optimise desired production objectives but also cope with unforeseen machine failures, rush orders, and changes in short-term demand. Previous control approaches were often implemented using a single operations layer and a standalone deep learning approach, which may not adequately address the complex organisational demands of modern manufacturing systems. To address this challenge, we propose a hyper-heuristics control model within a semi-heterarchical production system, in which multiple manufacturing and distribution agents are spread across pre-defined modules. The agents employ a deep reinforcement learning algorithm to learn a policy for selecting low-level heuristics in a situation-specific manner, thereby leveraging system performance and adaptability. We tested our approach in simulation and transferred it to a hybrid production environment. By that, we were able to demonstrate its multi-objective optimisation capabilities compared to conventional approaches in terms of mean throughput time, tardiness, and processing of prioritised orders in a multi-layered production system. The modular design is promising in reducing the overall system complexity and facilitates a quick and seamless integration into other scenarios.},
  language  = {en}
}
% Journal version in the International Journal of Production Research.
% The key carries an `a` suffix because the unsuffixed key is already used by
% an earlier entry in this file; a repeated key makes the later entry
% unreachable. The `series` copy of the journal title was removed and the
% journal name uses the same capitalisation as the other entry for this journal.
% NOTE(review): no volume/number in the export and pages 1--22 look like
% online-first pagination -- update once the issue assignment is known.
@article{PanzerBenderGronau2023a,
  author    = {Panzer, Marcel and Bender, Benedict and Gronau, Norbert},
  title     = {A deep reinforcement learning based hyper-heuristic for modular production control},
  journal   = {International Journal of Production Research},
  publisher = {Taylor \& Francis},
  address   = {London},
  issn      = {0020-7543},
  doi       = {10.1080/00207543.2023.2233641},
  pages     = {1--22},
  year      = {2023},
  abstract  = {In nowadays production, fluctuations in demand, shortening product life-cycles, and highly configurable products require an adaptive and robust control approach to maintain competitiveness. This approach must not only optimise desired production objectives but also cope with unforeseen machine failures, rush orders, and changes in short-term demand. Previous control approaches were often implemented using a single operations layer and a standalone deep learning approach, which may not adequately address the complex organisational demands of modern manufacturing systems. To address this challenge, we propose a hyper-heuristics control model within a semi-heterarchical production system, in which multiple manufacturing and distribution agents are spread across pre-defined modules. The agents employ a deep reinforcement learning algorithm to learn a policy for selecting low-level heuristics in a situation-specific manner, thereby leveraging system performance and adaptability. We tested our approach in simulation and transferred it to a hybrid production environment. By that, we were able to demonstrate its multi-objective optimisation capabilities compared to conventional approaches in terms of mean throughput time, tardiness, and processing of prioritised orders in a multi-layered production system. The modular design is promising in reducing the overall system complexity and facilitates a quick and seamless integration into other scenarios.},
  language  = {en}
}