forked from ChiaXinLiang/MLLM-book
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge branch 'dev' into marcus_brach
- Loading branch information
Showing
23 changed files
with
1,215 additions
and
46 deletions.
There are no files selected for viewing
Empty file.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1 @@ | ||
.cursorrules |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1 @@ | ||
MLLM_Reference |
12 changes: 12 additions & 0 deletions
12
...nd_Importance/Why do LLaVA Vision-Language Models Reply to Images in English.md
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,12 @@ | ||
title: Why do LLaVA Vision-Language Models Reply to Images in English? | ||
|
||
key_word: MLLM, VLM | ||
|
||
date of publish: 2024.07 | ||
|
||
Core idea: | ||
1. abstract: This paper investigates a significant multilingual bias in LLaVA-style vision-language models (VLMs), revealing that including an image in a query substantially increases the likelihood of the model responding in English, regardless of the query's original language. | ||
2. gap of current research: Current VLMs show a critical bias towards English in multimodal contexts, limiting their effectiveness in non-English language environments. | ||
3. innovation: The study employs a dual approach, combining extensive design space ablation with mechanistic analysis of the models' internal representations. | ||
4. method: The research utilizes a comprehensive methodology including design space exploration and in-depth analysis of model internals to identify the source and nature of the language bias. | ||
5. contribution: This research contributes to the development of more inclusive VLMs that can better serve non-English contexts, addressing a critical gap in current VLM capabilities and paving the way for more linguistically diverse multimodal AI systems. |
Empty file.
Binary file added
BIN
+1.85 MB
...eference/Chapter_1/1.1_Definition_and_Importance/figure_reference/why llava.jpg
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,115 @@ | ||
% Journal article in Annalen der Physik, volume 322 (1905).
@article{einstein,
  author  = {Einstein, Albert},
  title   = {On the Electrodynamics of Moving Bodies},
  journal = {Annalen der Physik},
  volume  = {322},
  pages   = {891--921},
  year    = {1905},
}
|
||
% Journal article; the acronym in the title is brace-protected so that
% sentence-casing styles do not lowercase it.
@article{konidena2024ethical,
  author  = {Konidena, Bhargav Kumar and Malaiyappan, Jesu Narkarunai Arasu and Tadimarri, Anish},
  title   = {Ethical Considerations in the Development and Deployment of {AI} Systems},
  journal = {European Journal of Technology},
  volume  = {8},
  number  = {2},
  pages   = {41--53},
  year    = {2024},
}
|
||
% arXiv preprint. The identifier is kept in the journal field so that classic
% styles, which ignore eprint fields, still print it.
@article{peng2024securing,
  author  = {Peng, Benji and Chen, Keyu and Li, Ming and Feng, Pohsun and Bi, Ziqian and Liu, Junyu and Niu, Qian},
  title   = {Securing Large Language Models: Addressing Bias, Misinformation, and Prompt Attacks},
  journal = {arXiv preprint arXiv:2409.08087},
  year    = {2024},
}
|
||
% Online news item from MIT News; the url field holds the raw address.
@article{boix2022machine,
  author  = {Boix, Xavier and Tenenbaum, Joshua B. and Torralba, Antonio},
  title   = {Can machine-learning models overcome biased datasets?},
  journal = {MIT News},
  year    = {2022},
  url     = {https://news.mit.edu/2022/machine-learning-biased-data-0221},
}
|
||
% Software repository. The author is an organisation, so it is double-braced
% to be treated as one indivisible name; the project name in the title is
% brace-protected to keep its exact casing.
@misc{pymetrics2022audit,
  author       = {{pymetrics}},
  title        = {{audit-AI}: Open Sourced Bias Testing for Generalized Machine Learning Applications},
  howpublished = {\url{https://github.com/pymetrics/audit-ai}},
  year         = {2022},
  note         = {GitHub repository},
}
|
||
% Conference paper. Authors must be joined with " and "; a comma-separated
% list is parsed by BibTeX as a single malformed name.
% NOTE(review): the citation key says "kim" although the first listed author
% is Ha; the key is left unchanged so existing citations keep resolving.
@inproceedings{kim2024domain,
  author    = {Ha, Seokhyeon and Jung, Sunbeom and Lee, Jungwoo},
  title     = {Domain-Aware Fine-Tuning: Enhancing Neural Network Adaptability},
  booktitle = {Proceedings of the 38th {AAAI} Conference on Artificial Intelligence},
  year      = {2024},
}
|
||
% arXiv preprint. The identifier 2408.04556 encodes a submission month of
% August 2024, so the year is 2024; the citation key still says 2023 and is
% left unchanged so existing citations keep resolving.
% NOTE(review): confirm the author list against the arXiv record for
% 2408.04556 before publication.
@article{zhang2023mitigating,
  author  = {Zhang, Xingchen and Ren, Zhuosheng and Jiang, Yihong and Zhao, Dongyan and Zhang, Rui},
  title   = {Bias-Aware Low-Rank Adaptation: Mitigating Catastrophic Inheritance of Large Language Models},
  journal = {arXiv preprint arXiv:2408.04556},
  year    = {2024},
}
|
||
% Journal article in the Journal of Medical Ethics; no volume or page data
% is recorded for it here.
@article{aquino2023practical,
  author    = {Aquino, Yves Saint James and Carter, Stacy M and Houssami, Nehmat and Braunack-Mayer, Annette and Win, Khin Than and Degeling, Chris and Wang, Lei and Rogers, Wendy A},
  title     = {Practical, epistemic and normative implications of algorithmic bias in healthcare artificial intelligence: a qualitative study of multidisciplinary expert perspectives},
  journal   = {Journal of Medical Ethics},
  year      = {2023},
  publisher = {Institute of Medical Ethics},
}
|
||
% arXiv preprint; the acronym in the title is brace-protected so that
% sentence-casing styles do not lowercase it.
@article{he2024emerged,
  author  = {He, Feng and Zhu, Tianqing and Ye, Dayong and Liu, Bo and Zhou, Wanlei and Yu, Philip S},
  title   = {The Emerged Security and Privacy of {LLM} Agent: A Survey with Case Studies},
  journal = {arXiv preprint arXiv:2407.19354},
  year    = {2024},
}
|
||
% Journal article; the leading acronym is brace-protected because sentence
% casing would otherwise lowercase every letter after the first.
@article{friha2024llm,
  author    = {Friha, Othmane and Ferrag, Mohamed Amine and Kantarci, Burak and Cakmak, Burak and Ozgun, Arda and Ghoualmi-Zine, Nassira},
  title     = {{LLM}-Based Edge Intelligence: A Comprehensive Survey on Architectures, Applications, Security and Trustworthiness},
  journal   = {IEEE Open Journal of the Communications Society},
  year      = {2024},
  publisher = {IEEE},
}
|
||
% Journal article; the ampersand in the publisher name is escaped for LaTeX.
@article{mccoy2023ethical,
  author    = {McCoy, Matthew S and Allen, Anita L and Kopp, Katharina and Mello, Michelle M and Patil, DJ and Ossorio, Pilar and Joffe, Steven and Emanuel, Ezekiel J},
  title     = {Ethical responsibilities for companies that process personal data},
  journal   = {The American Journal of Bioethics},
  volume    = {23},
  number    = {11},
  pages     = {11--23},
  year      = {2023},
  publisher = {Taylor \& Francis},
}
|
||
% arXiv preprint; the acronym in the title is brace-protected against
% sentence casing.
% NOTE(review): "Qi, Goh Si" may be a mis-split name (possibly surname Goh);
% verify against the arXiv record for 2408.12935.
@article{chen2024trustworthy,
  author  = {Chen, Chen and Liu, Ziyao and Jiang, Weifeng and Qi, Goh Si and Lam, Kwok-Yan},
  title   = {Trustworthy, Responsible, and Safe {AI}: A Comprehensive Architectural Framework for {AI} Safety with Challenges and Mitigations},
  journal = {arXiv preprint arXiv:2408.12935},
  year    = {2024},
}
|
||
% Journal article; the product name is brace-protected so that sentence
% casing does not turn it into "Chatgpt".
@article{ray2023chatgpt,
  author    = {Ray, Partha Pratim},
  title     = {{ChatGPT}: A comprehensive review on background, applications, key challenges, bias, ethics, limitations and future scope},
  journal   = {Internet of Things and Cyber-Physical Systems},
  volume    = {3},
  pages     = {121--154},
  year      = {2023},
  publisher = {Elsevier},
}
|
||
% Chapter in an edited book; booktitle names the containing volume.
@incollection{rosenstrauch2023artificial,
  author    = {Rosenstrauch, Doreen and Mangla, Utpal and Gupta, Atul and Masau, Costansia Taikwa},
  title     = {Artificial Intelligence and Ethics},
  booktitle = {Digital Health Entrepreneurship},
  pages     = {225--239},
  year      = {2023},
  publisher = {Springer},
}
Oops, something went wrong.