czczup committed on
Commit
7c93434
·
verified ·
1 Parent(s): 2e811e4

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +6 -12
README.md CHANGED
@@ -11,10 +11,6 @@ language:
11
  - multilingual
12
  tags:
13
  - internvl
14
- - vision
15
- - ocr
16
- - multi-image
17
- - video
18
  - custom_code
19
  ---
20
 
@@ -99,8 +95,6 @@ This model can also conduct an in-depth analysis of AAAI's official website and
99
 
100
  We provide example code to run InternVL-Chat-V1-1 using `transformers`.
101
 
102
- We also welcome you to experience the InternVL2 series models in our [online demo](https://internvl.opengvlab.com/).
103
-
104
  > Please use transformers>=4.37.2 to ensure the model works normally.
105
 
106
  ### Model Loading
@@ -500,16 +494,16 @@ If you find this project useful in your research, please consider citing:
500
  journal={arXiv preprint arXiv:2410.16261},
501
  year={2024}
502
  }
503
- @article{chen2023internvl,
504
- title={InternVL: Scaling up Vision Foundation Models and Aligning for Generic Visual-Linguistic Tasks},
505
- author={Chen, Zhe and Wu, Jiannan and Wang, Wenhai and Su, Weijie and Chen, Guo and Xing, Sen and Zhong, Muyan and Zhang, Qinglong and Zhu, Xizhou and Lu, Lewei and Li, Bin and Luo, Ping and Lu, Tong and Qiao, Yu and Dai, Jifeng},
506
- journal={arXiv preprint arXiv:2312.14238},
507
- year={2023}
508
- }
509
  @article{chen2024far,
510
  title={How Far Are We to GPT-4V? Closing the Gap to Commercial Multimodal Models with Open-Source Suites},
511
  author={Chen, Zhe and Wang, Weiyun and Tian, Hao and Ye, Shenglong and Gao, Zhangwei and Cui, Erfei and Tong, Wenwen and Hu, Kongzhi and Luo, Jiapeng and Ma, Zheng and others},
512
  journal={arXiv preprint arXiv:2404.16821},
513
  year={2024}
514
  }
 
 
 
 
 
 
515
  ```
 
11
  - multilingual
12
  tags:
13
  - internvl
 
 
 
 
14
  - custom_code
15
  ---
16
 
 
95
 
96
  We provide example code to run InternVL-Chat-V1-1 using `transformers`.
97
 
 
 
98
  > Please use transformers>=4.37.2 to ensure the model works normally.
99
 
100
  ### Model Loading
 
494
  journal={arXiv preprint arXiv:2410.16261},
495
  year={2024}
496
  }
 
 
 
 
 
 
497
  @article{chen2024far,
498
  title={How Far Are We to GPT-4V? Closing the Gap to Commercial Multimodal Models with Open-Source Suites},
499
  author={Chen, Zhe and Wang, Weiyun and Tian, Hao and Ye, Shenglong and Gao, Zhangwei and Cui, Erfei and Tong, Wenwen and Hu, Kongzhi and Luo, Jiapeng and Ma, Zheng and others},
500
  journal={arXiv preprint arXiv:2404.16821},
501
  year={2024}
502
  }
503
+ @article{chen2023internvl,
504
+ title={InternVL: Scaling up Vision Foundation Models and Aligning for Generic Visual-Linguistic Tasks},
505
+ author={Chen, Zhe and Wu, Jiannan and Wang, Wenhai and Su, Weijie and Chen, Guo and Xing, Sen and Zhong, Muyan and Zhang, Qinglong and Zhu, Xizhou and Lu, Lewei and Li, Bin and Luo, Ping and Lu, Tong and Qiao, Yu and Dai, Jifeng},
506
+ journal={arXiv preprint arXiv:2312.14238},
507
+ year={2023}
508
+ }
509
  ```