amir mehrpanah's commit #153

Open · wants to merge 1 commit into main
Binary file added assignments/2024/mehrpanah_amir/WASP_SE_M2.pdf
Binary file not shown.
35 changes: 35 additions & 0 deletions assignments/2024/mehrpanah_amir/bib.bib
@@ -0,0 +1,35 @@
@inproceedings{pp1,
author = {Nguyen, Minh-Tri and Truong, Hong-Linh and Truong-Huu, Tram},
title = {Novel Contract-based Runtime Explainability Framework for End-to-End Ensemble Machine Learning Serving},
year = {2024},
isbn = {9798400705915},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
url = {https://doi.org/10.1145/3644815.3644964},
doi = {10.1145/3644815.3644964},
abstract = {The growing complexity of end-to-end Machine Learning (ML) serving across the edge-cloud continuum has raised the necessity for runtime explainability to support service optimizations, transparency, and trustworthiness. That involves many challenges in managing ML service quality and engineering runtime explainability based on ML service contracts. Currently, consumers use ML services almost as a black box with insufficient explainability for not only inference decisions but also other contractual aspects, such as data/service quality and costs. The generic explainability for ML models is inadequate to explain the runtime ML usage for individual consumers. Moreover, ML-specific metrics have not been addressed in existing service contracts. In this work, we introduce a novel contract-based runtime explainability framework for end-to-end ensemble ML serving. The framework provides a comprehensive engineering toolset, including explainability constraints in ML contracts, report schemas, and interactions between ML consumers and the components of the ML serving for evaluating service quality with contract-based explanations. We develop new monitoring probes to measure ML-specific metrics on data quality, inference confidence, inference accuracy, and capture runtime ML usage. Finally, we present essential quality analyses via an observation agent. That interprets ML inferences and evaluates contributions of ML inference microservices, assisting ML serving optimization. The agent also integrates ML algorithms for detecting relations among metrics, supporting constraint developments. We demonstrate our work with two real-world applications for malware and object detection.},
booktitle = {Proceedings of the IEEE/ACM 3rd International Conference on AI Engineering - Software Engineering for AI},
pages = {234–244},
numpages = {11},
keywords = {ML explainability engineering, ML contract, SLA management, ensemble ML, ML serving},
location = {Lisbon, Portugal},
series = {CAIN '24}
}

@inproceedings{pp2,
author = {Lu, Qinghua and Zhu, Liming and Xu, Xiwei and Whittle, Jon and Xing, Zhenchang},
title = {Towards a roadmap on software engineering for responsible AI},
year = {2022},
isbn = {9781450392754},
publisher = {Association for Computing Machinery},
address = {New York, NY, USA},
url = {https://doi.org/10.1145/3522664.3528607},
doi = {10.1145/3522664.3528607},
abstract = {Although AI is transforming the world, there are serious concerns about its ability to behave and make decisions responsibly. Many ethical regulations, principles, and frameworks for responsible AI have been issued recently. However, they are high level and difficult to put into practice. On the other hand, most AI researchers focus on algorithmic solutions, while the responsible AI challenges actually crosscut the entire engineering lifecycle and components of AI systems. To close the gap in operationalizing responsible AI, this paper aims to develop a roadmap on software engineering for responsible AI. The roadmap focuses on (i) establishing multi-level governance for responsible AI systems, (ii) setting up the development processes incorporating process-oriented practices for responsible AI systems, and (iii) building responsible-AI-by-design into AI systems through system-level architectural style, patterns and techniques.},
booktitle = {Proceedings of the 1st International Conference on AI Engineering: Software Engineering for AI},
pages = {101–112},
numpages = {12},
keywords = {AI, DevOps, MLOps, ethics, machine learning, requirement engineering, responsible AI, software architecture, software engineering},
location = {Pittsburgh, Pennsylvania},
series = {CAIN '22}
}
79 changes: 79 additions & 0 deletions assignments/2024/mehrpanah_amir/main.tex
@@ -0,0 +1,79 @@
\documentclass[11pt]{article} % sets the font to 11 pt and says this is an article (as opposed to book or other documents)
\usepackage{amsfonts, amssymb}
\usepackage{float}
\usepackage{graphicx}
\usepackage{tikz}
\usepackage{url}
\usepackage[absolute,overlay]{textpos}
\usepackage{xcolor}
\usepackage{cite}
\usepackage{amsmath}% packages to get the fonts, symbols used in most math

%\usepackage{setspace} % Together with \doublespacing below allows for doublespacing of the document

\oddsidemargin=-0.5cm % These three commands create the margins required for class
\setlength{\textwidth}{6in}
\setlength{\textheight}{8in}%
% \addtolength{\voffset}{-50pt} %
\addtolength{\hoffset}{30pt}
% \addtolength{\headsep}{-10pt} %


\pagestyle{myheadings} % tells LaTeX to allow you to enter information in the heading
\markright{\hfill 13th December 2024 \quad}

%%% CHAT BOX

%%% END CHAT BOX

\newcommand{\eqn}[0]{\begin{array}{rcl}}%begin an aligned equation - allows for aligning = or inequalities. Always use with $$ $$
\newcommand{\eqnend}[0]{\end{array} } %end the aligned equation

\newcommand{\qed}[0]{$\square$} % make an unfilled square the default for ending a proof
\newcommand\restr[2]{{% we make the whole thing an ordinary symbol
\left. % automatically resize the bar with \right
#1 % the function
\right|_{#2} % this is the delimiter
}}
\newcommand{\sign}[0]{\textrm{sign}}
%\doublespacing % Together with the package setspace above allows for doublespacing of the document

\begin{document}


\vspace{2em}
\begin{center}
{\Huge Software Engineering for AI}\\
\vspace{1.5em}
Amir Mehrpanah (\url{[email protected]})
\end{center}

\section{Introduction to My Research Area}

My research focuses on making AI easier to understand, an area often referred to as explainable AI (XAI). There is still a lot of discussion about what “explainability” really means, but we already have some methods to dig into these models and try to figure out how they operate.
In short, explainability is about understanding how an AI system makes decisions and why it performs the way it does. As AI grows more complex and is applied in areas where mistakes have serious consequences, this becomes more and more important.



While much of AI research focuses on improving performance, my work is more about ensuring that AI systems are safe, reliable, and trustworthy. This relates closely to accountability and transparency, which are indispensable for using AI responsibly in real-world scenarios.



For example, imagine an AI that functions as a black box, and you have no idea why it’s making certain decisions. I look at how to uncover the patterns or features in the data that the AI relies on to make those decisions. In my PhD, I’m specifically working on explainability for vision models, such as those used for classification, but my interest extends to explainability in all types of AI systems.
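As a minimal illustration of the kind of analysis I mean (a sketch only, not the method I develop in my thesis; the model and the input tensor below are placeholders), a vanilla gradient saliency map scores each input pixel by how strongly the class score reacts to it:
\begin{verbatim}
# Minimal gradient-saliency sketch (illustrative only).
# Assumes a pretrained classifier `model` and an input image tensor `x`
# of shape (1, 3, H, W); both are placeholders here.
import torch

def gradient_saliency(model, x, target_class):
    model.eval()
    x = x.detach().clone().requires_grad_(True)  # track gradients w.r.t. the input
    score = model(x)[0, target_class]            # scalar class score (logit)
    score.backward()                             # d(score)/d(pixel) for every pixel
    # Aggregate over colour channels to get one importance value per pixel.
    return x.grad.abs().max(dim=1).values        # shape (1, H, W)
\end{verbatim}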



Given my background in mathematics, I approach these explainability problems with a formal perspective. I try to employ mathematical tools to analyze and formulate the challenges rigorously.
I hope this results in a more precise and structured examination of XAI methods, which in turn leads to models that can be trusted in practical, real-world scenarios. I have come to realize that, without mathematics, it is almost impossible to develop objective, robust, and interpretable explanations.
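
For instance, the vanilla gradient saliency sketched above, and its smoothed variant, can be written as formal objects (these are standard definitions from the literature, not my own formulation):
\[
S_c(x) = \left| \frac{\partial f_c(x)}{\partial x} \right|,
\qquad
\hat{S}_c(x) = \mathbb{E}_{\varepsilon \sim \mathcal{N}(0,\sigma^2 I)}
\left[ \frac{\partial f_c(x+\varepsilon)}{\partial x} \right],
\]
where $f_c$ denotes the score the model assigns to class $c$; the expectation on the right averages gradients over small perturbations, which is one way to make the explanation more robust.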


\input{p1}
\input{p2}

\section{Discussions on Papers}
\input{pp1}
\input{pp2}
\newpage
\bibliographystyle{plain}
\bibliography{bib}
\end{document}
43 changes: 43 additions & 0 deletions assignments/2024/mehrpanah_amir/p1.tex
@@ -0,0 +1,43 @@
\section{Ideas from Robert's Lectures}

\subsection{Validation and Verification in Software vs AI}
Explanations for AI models arise from the fundamental need to verify human-made systems before integrating them into our daily lives.
Software systems are explicitly defined by humans, making them inherently explainable and interpretable.
In contrast, the behavior of AI systems emerges from the optimization of a continuous objective, making it unclear how they arrive at their conclusions.
Hence, I believe the behavior of AI models is harder to investigate and attribute to certain parameters or input patterns.




I believe XAI still lacks robust definitions for validation and verification.
In terms of validation, we still do not know if we are truly addressing the right questions.
We do not yet have a clear definition of what makes a good explanation.
This uncertainty is likely a result of XAI research being in its early stages.



When it comes to verifying explanations, I think we need better ways to check whether a model is making the right decisions for the wrong reasons. This is much harder than regular software testing, because a model can appear highly accurate while still relying on flawed logic. Unlike software, where we can usually predict how things will behave, AI models are optimized for specific outcomes, which can sometimes lead to surprising or even bizarre results.



For example, a model might assume dogs always appear on grass and wolves on snow, which doesn’t hold up in the real world. This kind of faulty logic could make it label a dog on snow as a wolf. Right now, there’s no clear way to measure or explain this kind of behavior for individual examples, and that’s a big challenge we still need to figure out.
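One hedged sketch of how such a shortcut could at least be surfaced, assuming we can collect or synthesize a small counterfactual test split (dog on snow, wolf on grass); the model and data loaders below are placeholders:
\begin{verbatim}
# Sketch: compare accuracy on the usual test split vs. a counterfactual
# split where the background is swapped (dog-on-snow, wolf-on-grass).
# `model`, `standard_loader`, and `swapped_loader` are placeholders.
import torch

@torch.no_grad()
def accuracy(model, loader):
    model.eval()
    correct, total = 0, 0
    for images, labels in loader:
        preds = model(images).argmax(dim=1)
        correct += (preds == labels).sum().item()
        total += labels.numel()
    return correct / total

# A large gap between the two numbers hints that the model leans on the
# background rather than the animal itself:
# accuracy(model, standard_loader) vs. accuracy(model, swapped_loader)
\end{verbatim}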



One important aspect that is usually missed when comparing software testing and AI explainability is that variables defined by humans are usually human-understandable. The input variables of an AI model, on the other hand, can be raw pixels, from which the model builds new internal variables based on, say, 3x3 blocks of pixels. Despite considerable effort to make sense of these internal variables, their interpretation remains largely a mystery.
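
A small sketch of what I mean by machine-made variables: a single 3x3 convolution already turns blocks of pixels into feature channels that carry indices rather than human-given names (a toy example, not tied to any particular model):
\begin{verbatim}
# Sketch: a 3x3 convolution builds new "variables" (feature channels) from
# pixel neighbourhoods; the channels have indices, not human-readable meanings.
import torch
import torch.nn as nn

conv = nn.Conv2d(in_channels=3, out_channels=16, kernel_size=3, padding=1)
image = torch.randn(1, 3, 32, 32)   # a toy RGB image
features = conv(image)              # shape (1, 16, 32, 32)
# Each of the 16 channels is a learned combination of 3x3 pixel blocks;
# nothing in the model tells us what "channel 7" stands for.
print(features.shape)
\end{verbatim}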


\subsection{AI's Hidden Technical Debt}
Hidden technical debt can also be seen in AI, where researchers often adopt common approaches simply out of convenience.
From the perspective of an AI researcher focused on showing what is possible with AI, almost anything can be tried.
Such researchers often do not care whether their design decisions make sense mathematically or can be justified in all cases.



However, from the viewpoint of an XAI researcher, myself included, these decisions have accumulated into a huge hidden technical debt: we do not know the long-term implications of such decisions, how they interact with each other, or how they can be explained.



This issue is particularly widespread in the AI community, where many large-scale models have become black boxes.
Despite their capabilities, we lack a clear understanding of how these models make decisions.
26 changes: 26 additions & 0 deletions assignments/2024/mehrpanah_amir/p2.tex
@@ -0,0 +1,26 @@
\section{Ideas from the Invited Speakers}

\subsection{Adopting Transparent AI into Software Development}
Many companies fear that they are falling behind in the AI race.
This concern pushes them to integrate AI into their software by any means, or at the very least to use AI as a software development tool.
This urge conflicts with the safety concerns of SAAB and many other companies active in critical domains, such as the military. They cannot simply use AI tools provided online, as doing so risks unwanted leakage of information.



I think this is the direct result of AI models being opaque.
As an example, we cannot make sure that these models have not memorized parts of the code used in their training phase, nor do we know how to remove or recover such information if it exists.
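
As a very rough sketch of the kind of check I have in mind (the generate function and the snippet are placeholders; real memorization and extraction tests are far more involved), one could prompt the model with a prefix of sensitive code and look for verbatim continuations:
\begin{verbatim}
# Rough sketch: probe whether a code model reproduces a known snippet verbatim.
# `generate` stands in for whatever completion API is available; `snippet`
# is a placeholder for the proprietary code one is worried about.
def looks_memorized(generate, snippet, prefix_len=80, match_len=40):
    prefix, rest = snippet[:prefix_len], snippet[prefix_len:]
    completion = generate(prefix)          # the model's continuation
    # Verbatim overlap with the true continuation is a red flag,
    # although absence of overlap proves nothing.
    return rest[:match_len] in completion
\end{verbatim}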

\subsection{Using AI for Writing Tests}
As I pointed out in class during Dhasarathy's presentation, I think it is safer to write the tests first and then let AI generate the code that passes them.
This also becomes easier for AI in the long run, since it keeps getting better at filling in the gaps.
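
A toy example of what I mean (the function name is hypothetical, and the stub only exists so the file runs; in the workflow I describe, the AI would be asked to fill it in):
\begin{verbatim}
# Human-written, pytest-style tests committed *before* any AI-generated code.
# `brake_distance` is hypothetical; the stub is a placeholder for the
# implementation the AI would be asked to produce.

def brake_distance(speed_kmh: float) -> float:
    # Placeholder implementation (simple rule-of-thumb formula in metres).
    return (speed_kmh / 10.0) ** 2

def test_brake_distance_increases_with_speed():
    # The expected behaviour is fixed by a human, not inferred by the AI
    # from possibly buggy existing code.
    assert brake_distance(speed_kmh=50) < brake_distance(speed_kmh=100)

def test_brake_distance_is_zero_when_stopped():
    assert brake_distance(speed_kmh=0) == 0
\end{verbatim}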



It is important to note that writing tests is where human judgement is necessary.
If there is a bug in the code and we let the AI write the test for it, we give the AI the freedom to decide whether that behavior should pass the test.
The AI may then mistakenly incorporate the buggy behavior into the test it generates, letting a bug pass as expected behavior.
This can have drastic consequences if the bug is only noticed once the car is on the streets.
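
A toy illustration of that failure mode (hypothetical code, with a deliberate off-by-one bug): if the AI derives the test from the buggy implementation, the bug becomes the ``expected'' behaviour.
\begin{verbatim}
# Hypothetical buggy implementation: an off-by-one in a speed-limit check.
def is_over_speed_limit(speed_kmh: int, limit_kmh: int) -> bool:
    return speed_kmh > limit_kmh + 1   # BUG: tolerates 1 km/h too much

# A test generated *from* the code above would simply encode the bug:
def test_speed_limit_generated_from_buggy_code():
    assert is_over_speed_limit(51, 50) is False   # passes, but is wrong

# A human writing the test from the requirement would instead expect:
# assert is_over_speed_limit(51, 50) is True
\end{verbatim}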



This problem gets worse when we note that AI models are currently black boxes, so no one can verify whether the model's decisions follow the logic we intend, namely writing the correct test for incorrect code.
22 changes: 22 additions & 0 deletions assignments/2024/mehrpanah_amir/pp1.tex
@@ -0,0 +1,22 @@
\subsection{Novel Contract-based Runtime Explainability Framework for End-to-End Ensemble Machine Learning Serving \cite{pp1}}

This paper is about making machine learning (ML) services more understandable and trustworthy, under the important constraint that they are used in real-time applications. This requirement that XAI methods operate in real time is not relevant at the current stage of my research.



They introduce a new framework that allows AI service providers to ``explain'' (more on this later) how their models are working in real time. This includes showing consumers the quality of the predictions, for example accuracy or a measure of confidence.



They do this by adding explainability rules directly into service contracts (contracts between the service provider and the consumer), so that consumers know what to expect. Another constraint in this paper is its focus on ensembles of AI models, where multiple models work together to improve predictions. It is quite common practice in machine learning to let multiple models vote to reach a conclusion. Nonetheless, this makes it hard to provide one explanation for multiple models, especially when there are many of them.
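
To make the idea concrete for myself, a hypothetical explainability clause in such a contract might look like the sketch below (this is my own illustration and not the schema proposed in the paper; only the listed metric names come from the paper's abstract):
\begin{verbatim}
# Hypothetical sketch of an explainability clause in an ML service contract.
from dataclasses import dataclass, field

@dataclass
class ExplainabilityClause:
    min_reported_accuracy: float = 0.90     # provider must report accuracy
    min_inference_confidence: float = 0.70  # flag predictions below this
    report_interval_seconds: int = 60       # how often runtime reports arrive
    per_model_contributions: bool = True    # break reports down per ensemble member
    reported_metrics: list = field(default_factory=lambda: [
        "data_quality", "inference_confidence", "inference_accuracy",
    ])
\end{verbatim}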



The framework proposed in this paper makes it easier to monitor these systems and adjust them in real time based on consumer feedback, and the claim is that it improves service quality and trust. The authors test their approach on two real-world applications: malware detection and CCTV surveillance, to verify their claims that it works in practice.



I found this paper particularly interesting as it shows how the definition of explainability for AI systems can change from context to context. Here, explainability amounts to companies being ``honest'' with the consumer and showing them some classical metrics. In contrast, in my thesis we define it very differently, and under our definition it cannot be achieved merely by showing a few numbers.

I believe my research can give more depth to the report that a consumer might ask for, both in terms of content and type. On top of classical metrics, we could pinpoint some of the features that have led to the current outcome. This way, the consumer can check that the outcome is fair and is not based on the wrong reasons.

17 changes: 17 additions & 0 deletions assignments/2024/mehrpanah_amir/pp2.tex
@@ -0,0 +1,17 @@
\subsection{Towards a roadmap on software engineering for responsible AI \cite{pp2}}
This paper focuses on creating practical ways to build responsible and ethical AI systems that can be trusted.
It points out that we have many high-level ethical principles, yet there is a gap in turning those ideas into actual products.
Hence, the authors suggest three ways to close this gap:
\begin{itemize}
\item Having rules or guidelines at different levels: industry, organization, and team. This way, everyone developing AI is on the same page.
\item Having ethics embedded in the development process. This means that fairness, privacy, and safety are checked at every step.
\item Designing AI systems with responsibility in mind from the start.
This translates to techniques such as accountability tools or privacy-friendly methods like federated learning (a minimal sketch of which follows this list).
\end{itemize}
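
As a minimal sketch of the federated learning idea mentioned in the last item (federated averaging in its simplest form, written as a toy NumPy example rather than a production protocol):
\begin{verbatim}
# Minimal federated-averaging sketch: clients train locally and only share
# model parameters, never their raw (private) data. Toy NumPy version.
import numpy as np

def local_update(weights, X, y, lr=0.1, epochs=5):
    w = weights.copy()
    for _ in range(epochs):                 # plain linear-regression gradient steps
        grad = 2 * X.T @ (X @ w - y) / len(y)
        w -= lr * grad
    return w

def federated_average(global_w, client_data):
    # Each client updates the model on its own data; the server only averages
    # the returned weights (equal client weights for simplicity).
    updates = [local_update(global_w, X, y) for X, y in client_data]
    return np.mean(updates, axis=0)
\end{verbatim}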

This kind of work is important because it helps us bring AI into the real world responsibly.
Finally, this paper is related to my research, because XAI can be one way of making sure that AI systems are actually doing what we think they are doing.

One way of producing responsible AI systems is therefore to design tests that probe the inner workings of an AI system; but designing such tests requires a mental model of how things work, which I believe in turn requires XAI.