@misc{8821c826d8154eca8ce1edaa1cb83189,
title = "Intelligent Agents (in English): Agents, Mechanisms, and Collaboration / Agent Perception: Language and Vision / Actions Planning, Reinforcement-Learning / Causality (40 Vorlesungen, Universit{\"a}t zu L{\"u}beck 2019-2024)",
abstract = "Agents, Mechanisms, and Collaborationo Intelligent agents and artificial intelligenceo Game theory and social choiceo Mechanism design, algorithmic mechanism designo Agent collaboration, rules of encountero Epistemic logic introo Knowledge and seeingo Knowledge and timeo Dynamic epistemic logico Doxastic Logico Justification Logico Knowledge Based programso Excursion Fourier Analysis (Proof of Arrows Theorem)Perception of Agents (Language and Vision)o Information retrieval and web-mining agentso Probabilistic dimension reduction, latent content descriptions, topic models, LDAo Representation learning for sequential structures, embedding spaces, word2vec, CBOW, skip-gram, hierarchical softmax, negative samplingo Multi-relational latent semantic analysiso Language models (1d-CNNs, RNNs, LSTMs, ELMo, Transformers, BERT, GPT-3, T5, and beyond), natural language inference and query answering, reinforcement learning (InstructGPT), in-context learning, ChatGPTo LaMDA, Grounding, embedding knowledge graphs into language models, GNNs o Vision and Language (2D-CNNs: AlexNet, ResNet / Transfer Learning / ViLBERT / CLIP)o Generative vision models (DALL-E and beyond) VQ-VAE/d-VAE, DALL-E's transformero Summary: Agents and PerceptionActions of Agents (Planning, Causality, and Reinforcement Learning)o Introduction (Agent, planning, and acting)o Deterministic (State-variable representation, forward state-space search, heuristic functions, backward search, and plan-space search)o Temporal (Temporal representation, planning with temporal models, constraint management, and acting with temporal models)o Nondeterministic (Planning problem, and/or graph search, determination, and online approaches)o Probabilistic (Stochastic shortest-path problems, heuristic search algorithms, and online approaches including reinforcement learning)o Decision Making - Foundations (Utility theory, Markov decision processes, and reinforcement learning) - Extensions (Partially observable MDPs and decentralised POMDPs) - Structure (Lifted DecPOMDPs, Factored MDPs, and first-order MDPs)o Human-aware (Mental models, interpretable behaviour, and explanations)Causalityo Introduction to causal representations, causal leanringo Interventiono Instrumental variableso Counterfactuals",
author = "Ralf M{\"o}ller and Tanya Braun and Marcel Gehrke and {\"O}zg{\"u}r {\"O}z{\c c}ep",
year = "2024",
language = "English",
type = "Other",
}