Skip to content

Commit dcabd45

Browse files
authored
ci: release pkgs (#12)
* chore(ci): ui-tars packages publish * chore(ci): add changeset for ui-tars pkgs * refactor(shared): desktop-shared rename to shared * docs: ollama * chore: prepublish * chore: pkgs version * chore: publish scripts
1 parent 8263c6c commit dcabd45

File tree

28 files changed

+459
-103
lines changed

28 files changed

+459
-103
lines changed

.changeset/README.md

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,8 @@
1+
# Changesets
2+
3+
Hello and welcome! This folder has been automatically generated by `@changesets/cli`, a build tool that works
4+
with multi-package repos, or single-package repos to help you version and publish your code. You can
5+
find the full documentation for it [in our repository](https://github.com/changesets/changesets)
6+
7+
We have a quick list of common questions to get you started engaging with this project in
8+
[our documentation](https://github.com/changesets/changesets/blob/main/docs/common-questions.md)

.changeset/config.json

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,13 @@
1+
{
2+
"$schema": "https://unpkg.com/@changesets/config@3.0.5/schema.json",
3+
"changelog": "@changesets/cli/changelog",
4+
"commit": false,
5+
"fixed": [],
6+
"linked": [],
7+
"access": "restricted",
8+
"baseBranch": "main",
9+
"updateInternalDependencies": "patch",
10+
"ignore": [
11+
"ui-tars-desktop"
12+
]
13+
}

.changeset/lazy-pots-joke.md

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,6 @@
1+
---
2+
'@ui-tars/action-parser': major
3+
'@ui-tars/shared': major
4+
---
5+
6+
feat: initial publish ui-tars action-parser and shared pkgs

README.md

Lines changed: 14 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@ UI-TARS Desktop is a GUI Agent application based on [UI-TARS (Vision-Language Mo
1111
<p align="center">
1212
&nbsp&nbsp 📑 <a href="https://arxiv.org/abs/2501.12326">Paper</a> &nbsp&nbsp
1313
| 🤗 <a href="https://huggingface.co/bytedance-research/UI-TARS-7B-SFT">Hugging Face Models</a>&nbsp&nbsp
14-
|
14+
|
1515
<br>
1616
🖥️ Desktop Application &nbsp&nbsp
1717
| &nbsp&nbsp 👓 <a href="https://github.com/web-infra-dev/midscene">Midscene (use in browser)</a>
@@ -45,6 +45,10 @@ You can download the [latest release](https://github.com/bytedance/UI-TARS-deskt
4545
1. Drag **UI TARS** application into the **Applications** folder
4646
<img src="./images/mac_install.png" width="500px" />
4747

48+
> **Note**: If the app is broken, you can run `sudo xattr -dr com.apple.quarantine /Applications/UI\ TARS.app` in Terminal to fix it.
49+
>
50+
> <img src="./images/mac_broken.png" width="400px" />
51+
4852
2. Grant **UI TARS** the following permissions in macOS:
4953
- System Settings -> Privacy & Security -> **Accessibility**
5054
- System Settings -> Privacy & Security -> **Screen Recording**
@@ -53,9 +57,6 @@ You can download the [latest release](https://github.com/bytedance/UI-TARS-deskt
5357
3. Then open the **UI TARS** application; you should see the following interface:
5458
<img src="./images/mac_app.png" width="500px" />
5559

56-
> **Note**: If app broken, you can use `sudo xattr -dr com.apple.quarantine /Applications/UI\ TARS.app` in Terminal to fix it.
57-
>
58-
> <img src="./images/mac_broken.png" width="400px" />
5960

6061
#### Windows
6162

@@ -76,6 +77,15 @@ We recommend using HuggingFace Inference Endpoints for fast deployment. We provi
7677

7778
<img src="./images/settings_model.png" width="500px" />
7879

80+
If you use Ollama, you can use the following settings:
81+
82+
```yaml
83+
VLM Provider: ollama
84+
VLM Base Url: http://localhost:11434/v1
85+
VLM API Key: api_key
86+
VLM Model Name: ui-tars
87+
```
88+
7989
> **Note**: VLM Base Url is an OpenAI-compatible API endpoint (see [OpenAI API protocol document](https://platform.openai.com/docs/guides/vision/uploading-base-64-encoded-images) for more details).
8090
8191
## Development

package.json

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,6 +33,7 @@
3333
"publish:win32": "npm run build && electron-forge publish --arch=x64 --platform=win32",
3434
"publish:win32-arm64": "npm run build && electron-forge publish --arch=arm64 --platform=win32",
3535
"publish": "npm run build && electron-forge publish",
36+
"publish:packages": "pnpm changeset:version && pnpm install && changeset tag && pnpm publish -r --no-git-checks --access public",
3637
"prepare": "husky"
3738
},
3839
"dependencies": {
@@ -42,7 +43,7 @@
4243
"@electron-toolkit/utils": "^3.0.0",
4344
"@electron/notarize": "^2.3.2",
4445
"@ui-tars/action-parser": "workspace:*",
45-
"@ui-tars/desktop-shared": "workspace:*",
46+
"@ui-tars/shared": "workspace:*",
4647
"async-retry": "^1.3.3",
4748
"dotenv": "^16.4.7",
4849
"electron-debug": "^3.2.0",
@@ -81,6 +82,7 @@
8182
"devDependencies": {
8283
"@chakra-ui/react": "2.10.4",
8384
"@chakra-ui/theme-tools": "^2.2.6",
85+
"@changesets/cli": "^2.27.11",
8486
"@commitlint/cli": "^19.6.1",
8587
"@commitlint/config-conventional": "^19.6.0",
8688
"@electron-forge/cli": "^7.6.0",

packages/action-parser/package.json

Lines changed: 14 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1,25 +1,33 @@
11
{
22
"name": "@ui-tars/action-parser",
3-
"version": "1.0.0",
3+
"version": "0.0.1",
4+
"description": "Action parser SDK for UI-TARS",
5+
"keywords": [
6+
"AI",
7+
"Action",
8+
"Parser",
9+
"UI-TARS"
10+
],
411
"main": "./dist/index.js",
512
"module": "./dist/index.mjs",
613
"types": "./dist/index.d.ts",
714
"scripts": {
815
"dev": "tsup --watch",
16+
"prepublishOnly": "npm run build",
917
"prepare": "npm run build",
1018
"build": "tsup",
1119
"test": "vitest",
1220
"prepack": "npm run build"
1321
},
14-
"keywords": [],
15-
"author": "",
16-
"license": "ISC",
17-
"description": "",
22+
"license": "Apache-2.0",
1823
"files": [
1924
"dist"
2025
],
26+
"publishConfig": {
27+
"registry": "https://registry.npmjs.org"
28+
},
2129
"dependencies": {
22-
"@ui-tars/desktop-shared": "workspace:*"
30+
"@ui-tars/shared": "workspace:*"
2331
},
2432
"devDependencies": {
2533
"tsup": "^8.3.5",

packages/action-parser/src/index.ts

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
22
* Copyright (c) 2025 Bytedance, Inc. and its affiliates.
33
* SPDX-License-Identifier: Apache-2.0
44
*/
5-
import { ActionInputs, PredictionParsed } from '@ui-tars/desktop-shared/types';
5+
import { ActionInputs, PredictionParsed } from '@ui-tars/shared/types';
66

77
export function actionParser(params: { prediction: string; factor: number }): {
88
parsed: PredictionParsed[];

packages/shared/package.json

Lines changed: 12 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,7 @@
11
{
2-
"name": "@ui-tars/desktop-shared",
3-
"version": "1.0.0",
2+
"name": "@ui-tars/shared",
3+
"version": "0.0.1",
4+
"description": "Shared types for UI-TARS",
45
"exports": {
56
"./types": {
67
"import": "./dist/types/index.mjs",
@@ -24,21 +25,23 @@
2425
}
2526
},
2627
"scripts": {
28+
"prepublishOnly": "npm run build",
2729
"prepare": "npm run build",
2830
"dev": "tsup --watch",
2931
"build": "tsup",
3032
"prepack": "npm run build"
3133
},
32-
"keywords": [],
33-
"author": "",
34-
"license": "ISC",
35-
"description": "",
34+
"keywords": [
35+
"UI-TARS"
36+
],
37+
"license": "Apache-2.0",
38+
"publishConfig": {
39+
"registry": "https://registry.npmjs.org/"
40+
},
3641
"files": [
3742
"dist"
3843
],
39-
"dependencies": {
40-
"nanoid": "3.3.5"
41-
},
44+
"dependencies": {},
4245
"devDependencies": {
4346
"tsup": "^8.3.5",
4447
"typescript": "^5.7.2"

packages/shared/src/utils/random.ts

Lines changed: 0 additions & 17 deletions
This file was deleted.

packages/visualizer/package.json

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,7 @@
22
"name": "@ui-tars/visualizer",
33
"description": "Visualizer for Computer Use forked from @midscene/visualizer",
44
"version": "0.0.1",
5+
"private": true,
56
"repository": "https://github.com/web-infra-dev/midscene",
67
"homepage": "https://midscenejs.com/",
78
"types": "./dist/types/index.d.ts",

0 commit comments

Comments
 (0)