-
Notifications
You must be signed in to change notification settings - Fork 18
/
Copy pathpangu-spacing.el
357 lines (304 loc) · 13.3 KB
/
pangu-spacing.el
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
;;; pangu-spacing.el --- Minor-mode to add space between Chinese and English characters.
;; Copyright (C) 2013, 2014 Yen-Chin, Lee.
;; Author: coldnew <coldnew.tw@gmail.com>
;; Kyewords: converience
;; Version: 0.4
;; X-URL: http://github.com/coldnew/pangu-spacing
;; URL: http://github.com/coldnew/pangu-spacing
;; This file is free software: you can redistribute it and/or modify
;; it under the terms of the GNU General Public License as published by
;; the Free Software Foundation, either version 3 of the License, or
;; (at your option) any later version.
;; This file is distributed in the hope that it will be useful,
;; but WITHOUT ANY WARRANTY; without even the implied warranty of
;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
;; GNU General Public License for more details.
;; You should have received a copy of the GNU General Public License
;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>.
;;; Commentary:
;;; Screenshot:
;; ![Screenshot](https://github.com/coldnew/pangu-spacing/raw/master/screenshot/screenshot.gif)
;;; Commentary (English):
;; pangu-spacing-mode is an minor-mode to auto add `space' between Chinese
;; and English characters. Note that these whitespace characters are not really
;; added to your file. It's just a local visual change.
;; Take following sentance for example:
;;
;; 你好,我是coldnew,我喜歡使用emacs。
;;
;; After you use pangu-spacing-mode, you will see
;;
;; 你好,我是 coldnew,我喜歡使用 emacs。
;;
;; But the text doesn't get modified by this mode. After disabling
;; pangu-spacing-mode, or when using another text editor to open the file, you
;; will still see:
;;
;; 你好,我是coldnew,我喜歡使用emacs。
;; pangu-spacing is named from [pangu.js](https://github.com/vinta/pangu.js)'s README.
;;
;; Translation of pangu.js's README [1]
;;
;; If you are the one who feel quiet ill when see Chinese,
;; English and digits characters squeezed together and
;; want to add whitespace to separate them, this plugin (support
;; Chrome and Firefox) is what you need when surfing the
;; internet. It will add whitespace between Chinese,
;; half-width English, digits and symbols automatically.
;; These spaces between English and Chinese characters are called
;; pangu-spacing by a sinologist, since it breaks the confusion
;; between full-width and half-width characters.
;; Studies showed that people who dislike adding whitespace between
;; English and Chinese characters also have relationship problems.
;; Almost 70 percent of them will get married to the one they
;; don't love, the rest are only left to their cat.
;; Indeed, love and writing need some space in good time.
;; Let's go for it.
;; [1] https://github.com/vinta/pangu.js
;;; Commentary (Chinese):
;; pangu-spacing-mode 是一個可以自動幫你將中文與英文之間加上`空白'作為分隔的 minor-mode, 他的名稱來自於 [pangu.js](https://github.com/vinta/pangu.js) 上的 README。
;;
;; 引述自 pangu.js README [1]
;;
;; 如果你跟我一樣,每次看到網頁上的中文字和英文、數字、符號擠在一塊,就會
;; 坐立難安,忍不住想在它們之間加個空格。這個外掛(支援 Chrome 和 Firefox)
;; 正是你在網路世界走跳所需要的東西,它會自動替你在網頁中所有的中文字和半
;; 形的英文、數字、符號之間插入空白。
;;
;; 漢學家稱這個空白字元為「盤古之白」,因為它劈開了全形字和半形字之間的混
;; 沌。另有研究顯示,打字的時候不喜歡在中文和英文之間加空格的人,感情路都
;; 走得很辛苦,有七成的比例會在 34 歲的時候跟自己不愛的人結婚,而其餘三成
;; 的人最後只能把遺產留給自己的貓。畢竟愛情跟書寫都需要適時地留白。
;;
;; 與大家共勉之。
;; [1] https://github.com/vinta/pangu.js
;;; Installation:
;; If you have `melpa` and `emacs24` installed, simply type:
;;
;; M-x package-install pangu-spacing
;;
;; For `cask' user, just add following lines in your `Cask' file
;;
;; ```elisp
;; (source melpa)
;;
;; (depends-on "pangu-spacing")
;; ```
;;
;;; Configuration
;; In your .emacs
;;
;; ```elisp
;; (require 'pangu-spacing)
;; (global-pangu-spacing-mode 1)
;; ```
;;
;; pangu-spacing-mode does not actuall yinsert space between English and
;; Chinese by default. If you want this behaviour, enable this option manually.
;;
;; ```elisp
;; (setq pangu-spacing-real-insert-separtor t)
;; ```
;;
;; After enabling this, pangu-space will be inserted before you save file.
;;
;; If you only want to insert whitespace in some specific mode, but add
;; virtual space in another mode, you can use following code to achieve
;; this: (take org-mode as example)
;;
;; ```elisp
;; (add-hook 'org-mode-hook
;; '(lambda ()
;; (set (make-local-variable 'pangu-spacing-real-insert-separtor) t)))
;; ```
;;
;;; Code:
(defgroup pangu-spacing nil
"Add space between Chinese and English characters automatically."
:group 'convenience
:link '(url-link :tag "Github" "https://github.com/coldnew/pangu-spacing"))
;;;; Custom Variables
(defcustom pangu-spacing-separator " "
"String to be displayed between Chinese and English."
:group 'pangu-spacing
:type 'string
:initialize 'custom-initialize-default)
(defcustom pangu-spacing-real-insert-separtor nil
"Set t or nil to make space show only on overlay or insert in file.
When you set t here, the space will be insert when you save file."
:group 'pangu-spacing
:type 'boolean)
(defface pangu-spacing-separator-face nil
"Face for pangu-spacing-mode separator."
:group 'pangu-spacing)
(defcustom pangu-spacing-inhibit-mode-alist '(eshell-mode shell-mode term-mode)
"Inhibit mode alist for pangu-spacing-mode."
:group 'pangu-spacing
:type 'list)
;;;; Local variables
;; NOTE:
;; We use `chinse-two-byte' instead of `chinese-two-byte', since there
;; are some typo in emacs version 21.1-24.3. For more information,
;; see:
;;
;; [Emacs-diffs] trunk r115873: Fix misspelling of 'chinese' in rx.
;;
;; Url: http://lists.gnu.org/archive/html/emacs-diffs/2014-01/msg00049.html
;;
(eval-when-compile (require 'rx))
(defun pangu-spacing-chinese-two-byte-category ()
"Return the correct category name for Chinese two-byte characters."
(if (assq 'chinese-two-byte rx--categories)
"chinese-two-byte"
"chinse-two-byte"))
(defvar pangu-spacing-include-regexp
;; we didn't add korean because korean-hangul-two-byte is not implemented
(eval `(rx (or (and (or (group-n 3 (any "。,!?;:「」()、"))
(group-n 1 (or (category ,(intern (pangu-spacing-chinese-two-byte-category)))
(category japanese-hiragana-two-byte)
(category japanese-katakana-two-byte))))
(group-n 2 (in "a-zA-Z0-9")))
(and (group-n 1 (in "a-zA-Z0-9"))
(or (group-n 3 (any "。,!?;:「」()、"))
(group-n 2 (or (category ,(intern (pangu-spacing-chinese-two-byte-category)))
(category japanese-hiragana-two-byte)
(category japanese-katakana-two-byte))))))))
"Regexp to find Chinese character before English character.
Group 1 contains the character before the potential pangu
spacing, and group 2 the character after that. A space is needed
when both group 1 and group 2 are non-nil. Group 3 exists as a
workaround for excluded characters. Since rx does not support
matching text that satisfy two regexp at the same time (we want
to match all Chinese two byte characters, but not punctuations),
we first try to match excluded characters, then the characters
that need pangu-spacing. The excluded characters will be matched
to group 3, and shortcut the matching for Chinese characters.
Thus group 1 and group 2 will both be non nil when a pangu space
is needed.")
;;;; Functions
(defmacro pangu-spacing-search-buffer (regexp start end func)
"Helper macro to search buffer and do func according regexp for
pangu-spacing-mode."
`(let ((start ,start) (end ,end))
(save-excursion
(goto-char start)
(while (re-search-forward ,regexp end t)
(when (and (match-beginning 1)
(match-beginning 2))
,func
(backward-char))))))
(defmacro pangu-spacing-search-overlay (beg end func regexp)
"Helper macro to search and update overlay according func and regexp for
pangu-sapce-mode."
`(pangu-spacing-search-buffer ,regexp ,beg ,end
(,func (match-beginning 1) (match-end 1))))
(defun pangu-spacing-org-mode-at-special-region ()
(interactive)
(let ((element (org-element-at-point)))
(when (or (member (org-element-type element)
'(src-block keyword example-block export-block
latex-environment planning))
(member (car (org-element-context element))
'(inline-src-block timestamp link code verbatim)))
t)))
(defcustom pangu-spacing-special-region-func-alist
'((org-mode . pangu-spacing-org-mode-at-special-region))
"Alist mapping major-mode to the corresponding function to
check for special region that shall not write real pangu-space"
:group 'pangu-spacing
:type '(alist :key-type (symbol)
:value-type (function)))
(defun pangu-spacing-search-and-replace (match regexp)
"Replace regexp with match in buffer."
(let ((at-special-region-func
(cdr (assq major-mode pangu-spacing-special-region-func-alist))))
(pangu-spacing-search-buffer
regexp (point-min) (point-max)
(unless (and at-special-region-func
(save-match-data (funcall at-special-region-func)))
(replace-match match nil nil)))))
(defun pangu-spacing-overlay-p (ov)
"Determine whether overlay OV was created by space-between."
(and (overlayp ov) (overlay-get ov 'pangu-spacing-overlay)))
(defun pangu-spacing-check-overlay (beg end)
"Insert a space between English words and Chinese characters in overlay."
(setq beg (if beg
(max (- beg 1) (point-min))
(point-min))
end (or end (point-max)))
(pangu-spacing-delete-overlay beg end)
(setq end (min (1+ end) (point-max)))
(pangu-spacing-search-overlay beg end
pangu-spacing-make-overlay
pangu-spacing-include-regexp)
)
(defun pangu-spacing-modify-buffer ()
"Real insert separator between English words and Chinese characters in buffer."
(when pangu-spacing-real-insert-separtor
(pangu-spacing-search-and-replace "\\1 \\2"
pangu-spacing-include-regexp))
;; nil must be returned to allow use in write file hooks
nil)
(defun pangu-spacing-region-has-pangu-spacing-overlays (beg end)
"Check if region specified by BEG and END has overlay.
Return t if it has at least one pangu-spacing overlay, nil if no overlay."
(let ((ov (overlays-in beg end))
(has-pangu-spacing-overlays nil))
(while (consp ov)
(when (pangu-spacing-overlay-p (car ov))
(setq has-pangu-spacing-overlays t
;; break the while loop
ov nil))
(setq ov (cdr ov))
has-pangu-spacing-overlays)))
(defun pangu-spacing-make-overlay (beg end)
"Allocate a pangu-spacing overlay in range."
(when (not (pangu-spacing-region-has-pangu-spacing-overlays beg end))
(let ((ov (make-overlay beg end nil t t))
(face 'pangu-spacing-separator-face))
(overlay-put ov 'pangu-spacing-overlay t)
(overlay-put ov 'after-string (propertize pangu-spacing-separator 'face face))
ov)))
(defun pangu-spacing-delete-overlay (beg end)
"Delete all pangu-spacing-overlays in BUFFER."
(dolist (ov (overlays-in beg end))
(when (pangu-spacing-overlay-p ov)
(delete-overlay ov))))
(defun pangu-spacing-delete-all-overlays (&optional beg end)
"Delete all pangu-spacing-overlays in BUFFER."
(pangu-spacing-delete-overlay (point-min) (point-max)))
(defun turn-on-pangu-spacing (beg end)
(pangu-spacing-check-overlay beg end))
;;;###autoload
(defun pangu-spacing-space-current-buffer ()
"Space current buffer.
It will really insert separator, no matter what
`pangu-spacing-real-insert-separtor' is."
(interactive)
(let ((pangu-spacing-real-insert-separtor t))
(pangu-spacing-modify-buffer)))
;;;###autoload
(define-minor-mode pangu-spacing-mode
"Toggle pangu-spacing-mode"
:group 'pangu-spacing
:global nil
:init-value nil
:lighter " Ρ"
(unless (or (member major-mode pangu-spacing-inhibit-mode-alist)
(minibufferp (current-buffer)))
(save-restriction
(widen)
(if pangu-spacing-mode
(progn
(jit-lock-register 'turn-on-pangu-spacing)
(add-hook 'local-write-file-hooks 'pangu-spacing-modify-buffer))
(progn
(jit-lock-unregister 'turn-on-pangu-spacing)
(remove-hook 'local-write-file-hooks 'pangu-spacing-modify-buffer)
(pangu-spacing-delete-all-overlays)))))
pangu-spacing-mode)
;;;###autoload
(define-globalized-minor-mode global-pangu-spacing-mode
pangu-spacing-mode pangu-spacing-mode)
(provide 'pangu-spacing)
;;; pangu-spacing.el ends here