mirror of
https://github.com/microsoft/PowerToys.git
synced 2024-12-19 14:27:55 +08:00
524 lines
14 KiB
Plaintext
524 lines
14 KiB
Plaintext
# marker to ignore all code on line
|
|
^.*/\* #no-spell-check-line \*/.*$
|
|
# marker for ignoring a comment to the end of the line
|
|
// #no-spell-check.*$
|
|
|
|
# patch hunk comments
|
|
^\@\@ -\d+(?:,\d+|) \+\d+(?:,\d+|) \@\@ .*
|
|
# git index header
|
|
index [0-9a-z]{7,40}\.\.[0-9a-z]{7,40}
|
|
|
|
# cid urls
|
|
(['"])cid:.*?\g{-1}
|
|
|
|
# data url in parens
|
|
\(data:[^)]*?(?:[A-Z]{3,}|[A-Z][a-z]{2,}|[a-z]{3,})[^)]*\)
|
|
# data url in quotes
|
|
([`'"])data:.*?(?:[A-Z]{3,}|[A-Z][a-z]{2,}|[a-z]{3,}).*\g{-1}
|
|
# data url
|
|
data:[-a-zA-Z=;:/0-9+]*,\S*
|
|
|
|
# mailto urls
|
|
mailto:[-a-zA-Z=;:/?%&0-9+@.]{3,}
|
|
|
|
# magnet urls
|
|
magnet:[?=:\w]+
|
|
|
|
# magnet urls in quotes
|
|
"magnet:[^"]+"
|
|
|
|
# obs:
|
|
"obs:[^"]*"
|
|
|
|
# The `\b` here matches a word boundary; it's the fancy way to handle urls, but it makes things harder to read
|
|
# In this example content, I'm using a number of different ways to match things to show various approaches
|
|
# asciinema
|
|
\basciinema\.org/a/[0-9a-zA-Z]+
|
|
|
|
# apple
|
|
\bdeveloper\.apple\.com/[-\w?=/]+
|
|
# Apple music
|
|
\bembed\.music\.apple\.com/fr/playlist/usr-share/[-\w.]+
|
|
|
|
# appveyor api
|
|
\bci\.appveyor\.com/api/projects/status/[0-9a-z]+
|
|
# appveyor project
|
|
\bci\.appveyor\.com/project/(?:[^/\s"]*/){2}builds?/\d+/job/[0-9a-z]+
|
|
|
|
# Amazon
|
|
|
|
# Amazon
|
|
\bamazon\.com/[-\w]+/(?:dp/[0-9A-Z]+|)
|
|
# AWS S3
|
|
\b\w*\.s3[^.]*\.amazonaws\.com/[-\w/&#%_?:=]*
|
|
# AWS execute-api
|
|
\b[0-9a-z]{10}\.execute-api\.[-0-9a-z]+\.amazonaws\.com\b
|
|
# AWS ELB
|
|
\b\w+\.[-0-9a-z]+\.elb\.amazonaws\.com\b
|
|
# AWS SNS
|
|
\bsns\.[-0-9a-z]+.amazonaws\.com/[-\w/&#%_?:=]*
|
|
# AWS VPC
|
|
vpc-\w+
|
|
|
|
# While you could try to match `http://` and `https://` by using `s?` in `https?://`, most of the patterns below skip the scheme and anchor on the host name with `\b` instead
|
|
# YouTube url
|
|
\b(?:(?:www\.|)youtube\.com|youtu.be)/(?:channel/|embed/|user/|playlist\?list=|watch\?v=|v/|)[-a-zA-Z0-9?&=_%]*
|
|
# YouTube music
|
|
\bmusic\.youtube\.com/youtubei/v1/browse(?:[?&]\w+=[-a-zA-Z0-9?&=_]*)
|
|
# YouTube tag
|
|
<\s*youtube\s+id=['"][-a-zA-Z0-9?_]*['"]
|
|
# YouTube image
|
|
\bimg\.youtube\.com/vi/[-a-zA-Z0-9?&=_]*
|
|
# Google Accounts
|
|
\baccounts.google.com/[-_/?=.:;+%&0-9a-zA-Z]*
|
|
# Google Analytics
|
|
\bgoogle-analytics\.com/collect.[-0-9a-zA-Z?%=&_.~]*
|
|
# Google APIs
|
|
\bgoogleapis\.(?:com|dev)/[a-z]+/(?:v\d+/|)[a-z]+/[-@:./?=\w+|&]+
|
|
# Google Storage
|
|
\b[-a-zA-Z0-9.]*\bstorage\d*\.googleapis\.com(?:/\S*|)
|
|
# Google Calendar
|
|
\bcalendar\.google\.com/calendar(?:/u/\d+|)/embed\?src=[@./?=\w&%]+
|
|
\w+\@group\.calendar\.google\.com\b
|
|
# Google DataStudio
|
|
\bdatastudio\.google\.com/(?:(?:c/|)u/\d+/|)(?:embed/|)(?:open|reporting|datasources|s)/[-0-9a-zA-Z]+(?:/page/[-0-9a-zA-Z]+|)
|
|
# The leading `/` here is as opposed to the `\b` above
|
|
# ... a short way to match `https://` or `http://` since most urls have one of those prefixes
|
|
# Google Docs
|
|
/docs\.google\.com/[a-z]+/(?:ccc\?key=\w+|(?:u/\d+|d/(?:e/|)[0-9a-zA-Z_-]+/)?(?:edit\?[-\w=#.]*|/\?[\w=&]*|))
|
|
# Google Drive
|
|
\bdrive\.google\.com/(?:file/d/|open)[-0-9a-zA-Z_?=]*
|
|
# Google Groups
|
|
\bgroups\.google\.com/(?:(?:forum/#!|d/)(?:msg|topics?|searchin)|a)/[^/\s"]+/[-a-zA-Z0-9$]+(?:/[-a-zA-Z0-9]+)*
|
|
# Google Maps
|
|
\bmaps\.google\.com/maps\?[\w&;=]*
|
|
# Google themes
|
|
themes\.googleusercontent\.com/static/fonts/[^/\s"]+/v\d+/[^.]+.
|
|
# Google CDN
|
|
\bclients2\.google(?:usercontent|)\.com[-0-9a-zA-Z/.]*
|
|
# Goo.gl
|
|
/goo\.gl/[a-zA-Z0-9]+
|
|
# Google Chrome Store
|
|
\bchrome\.google\.com/webstore/detail/[-\w]*(?:/\w*|)
|
|
# Google Books
|
|
\bgoogle\.(?:\w{2,4})/books(?:/\w+)*\?[-\w\d=&#.]*
|
|
# Google Fonts
|
|
\bfonts\.(?:googleapis|gstatic)\.com/[-/?=:;+&0-9a-zA-Z]*
|
|
# Google Forms
|
|
\bforms\.gle/\w+
|
|
# Google Scholar
|
|
\bscholar\.google\.com/citations\?user=[A-Za-z0-9_]+
|
|
# Google Colab Research Drive
|
|
\bcolab\.research\.google\.com/drive/[-0-9a-zA-Z_?=]*
|
|
|
|
# GitHub SHAs (api)
|
|
\bapi.github\.com/repos(?:/[^/\s"]+){3}/[0-9a-f]+\b
|
|
# GitHub SHAs (markdown)
|
|
(?:\[`?[0-9a-f]+`?\]\(https:/|)/(?:www\.|)github\.com(?:/[^/\s"]+){2,}(?:/[^/\s")]+)(?:[0-9a-f]+(?:[-0-9a-zA-Z/#.]*|)\b|)
|
|
# GitHub SHAs
|
|
\bgithub\.com(?:/[^/\s"]+){2}[@#][0-9a-f]+\b
|
|
# GitHub wiki
|
|
\bgithub\.com/(?:[^/]+/){2}wiki/(?:(?:[^/]+/|)_history|[^/]+(?:/_compare|)/[0-9a-f.]{40,})\b
|
|
# githubusercontent
|
|
/[-a-z0-9]+\.githubusercontent\.com/[-a-zA-Z0-9?&=_\/.]*
|
|
# githubassets
|
|
\bgithubassets.com/[0-9a-f]+(?:[-/\w.]+)
|
|
# gist github
|
|
\bgist\.github\.com/[^/\s"]+/[0-9a-f]+
|
|
# git.io
|
|
\bgit\.io/[0-9a-zA-Z]+
|
|
# GitHub JSON
|
|
"node_id": "[-a-zA-Z=;:/0-9+]*"
|
|
# Contributor
|
|
\[[^\]]+\]\(https://github\.com/[^/\s"]+\)
|
|
# GHSA
|
|
GHSA(?:-[0-9a-z]{4}){3}
|
|
|
|
# GitLab commit
|
|
\bgitlab\.[^/\s"]*/\S+/\S+/commit/[0-9a-f]{7,16}#[0-9a-f]{40}\b
|
|
# GitLab merge requests
|
|
\bgitlab\.[^/\s"]*/\S+/\S+/-/merge_requests/\d+/diffs#[0-9a-f]{40}\b
|
|
# GitLab uploads
|
|
\bgitlab\.[^/\s"]*/uploads/[-a-zA-Z=;:/0-9+]*
|
|
# GitLab commits
|
|
\bgitlab\.[^/\s"]*/(?:[^/\s"]+/){2}commits?/[0-9a-f]+\b
|
|
|
|
# binance
|
|
accounts.binance.com/[a-z/]*oauth/authorize\?[-0-9a-zA-Z&%]*
|
|
|
|
# bitbucket diff
|
|
\bapi\.bitbucket\.org/\d+\.\d+/repositories/(?:[^/\s"]+/){2}diff(?:stat|)(?:/[^/\s"]+){2}:[0-9a-f]+
|
|
# bitbucket repositories commits
|
|
\bapi\.bitbucket\.org/\d+\.\d+/repositories/(?:[^/\s"]+/){2}commits?/[0-9a-f]+
|
|
# bitbucket commits
|
|
\bbitbucket\.org/(?:[^/\s"]+/){2}commits?/[0-9a-f]+
|
|
|
|
# bit.ly
|
|
\bbit\.ly/\w+
|
|
|
|
# bitrise
|
|
\bapp\.bitrise\.io/app/[0-9a-f]*/[\w.?=&]*
|
|
|
|
# bootstrapcdn.com
|
|
\bbootstrapcdn\.com/[-./\w]+
|
|
|
|
# cdnjs.cloudflare.com
|
|
\bcdnjs\.cloudflare\.com/[./\w]+
|
|
|
|
# circleci
|
|
\bcircleci\.com/gh(?:/[^/\s"]+){1,5}.[a-z]+\?[-0-9a-zA-Z=&]+
|
|
|
|
# gitter
|
|
\bgitter\.im(?:/[^/\s"]+){2}\?at=[0-9a-f]+
|
|
|
|
# gravatar
|
|
\bgravatar\.com/avatar/[0-9a-f]+
|
|
|
|
# ibm
|
|
[a-z.]*ibm\.com/[-_#=:%!?~.\\/\d\w]*
|
|
|
|
# imgur
|
|
\bimgur\.com/[^.]+
|
|
|
|
# Internet Archive
|
|
\barchive\.org/web/\d+/(?:[-\w.?,'/\\+&%$#_:]*)
|
|
|
|
# discord
|
|
/discord(?:app\.com|\.gg)/(?:invite/)?[a-zA-Z0-9]{7,}
|
|
|
|
# Disqus
|
|
\bdisqus\.com/[-\w/%.()!?&=_]*
|
|
|
|
# medium link
|
|
\blink\.medium\.com/[a-zA-Z0-9]+
|
|
# medium
|
|
\bmedium\.com/\@?[^/\s"]+/[-\w]+
|
|
|
|
# microsoft
|
|
\b(?:https?://|)(?:(?:download\.visualstudio|docs|msdn2?|research)\.microsoft|blogs\.msdn)\.com/[-_a-zA-Z0-9()=./%]*
|
|
# powerbi
|
|
\bapp\.powerbi\.com/reportEmbed/[^"' ]*
|
|
# vs devops
|
|
\bvisualstudio.com(?::443|)/[-\w/?=%&.]*
|
|
# microsoft store
|
|
\bmicrosoft\.com/store/apps/\w+
|
|
|
|
# mvnrepository.com
|
|
\bmvnrepository\.com/[-0-9a-z./]+
|
|
|
|
# now.sh
|
|
/[0-9a-z-.]+\.now\.sh\b
|
|
|
|
# oracle
|
|
\bdocs\.oracle\.com/[-0-9a-zA-Z./_?#&=]*
|
|
|
|
# chromatic.com
|
|
/\S+.chromatic.com\S*[")]
|
|
|
|
# codacy
|
|
\bapi\.codacy\.com/project/badge/Grade/[0-9a-f]+
|
|
|
|
# compai
|
|
\bcompai\.pub/v1/png/[0-9a-f]+
|
|
|
|
# mailgun api
|
|
\.api\.mailgun\.net/v3/domains/[0-9a-z]+\.mailgun.org/messages/[0-9a-zA-Z=@]*
|
|
# mailgun
|
|
\b[0-9a-z]+.mailgun.org
|
|
|
|
# /message-id/
|
|
/message-id/[-\w@./%]+
|
|
|
|
# Reddit
|
|
\breddit\.com/r/[/\w_]*
|
|
|
|
# requestb.in
|
|
\brequestb\.in/[0-9a-z]+
|
|
|
|
# sched
|
|
\b[a-z0-9]+\.sched\.com\b
|
|
|
|
# Slack url
|
|
slack://[a-zA-Z0-9?&=]+
|
|
# Slack
|
|
\bslack\.com/[-0-9a-zA-Z/_~?&=.]*
|
|
# Slack edge
|
|
\bslack-edge\.com/[-a-zA-Z0-9?&=%./]+
|
|
# Slack images
|
|
\bslack-imgs\.com/[-a-zA-Z0-9?&=%.]+
|
|
|
|
# shields.io
|
|
\bshields\.io/[-\w/%?=&.:+;,]*
|
|
|
|
# stackexchange -- https://stackexchange.com/feeds/sites
|
|
\b(?:askubuntu|serverfault|stack(?:exchange|overflow)|superuser).com/(?:questions/\w+/[-\w]+|a/)
|
|
|
|
# Sentry
|
|
[0-9a-f]{32}\@o\d+\.ingest\.sentry\.io\b
|
|
|
|
# Twitter markdown
|
|
\[\@[^[/\]:]*?\]\(https://twitter.com/[^/\s"')]*(?:/status/\d+(?:\?[-_0-9a-zA-Z&=]*|)|)\)
|
|
# Twitter hashtag
|
|
\btwitter\.com/hashtag/[\w?_=&]*
|
|
# Twitter status
|
|
\btwitter\.com/[^/\s"')]*(?:/status/\d+(?:\?[-_0-9a-zA-Z&=]*|)|)
|
|
# Twitter profile images
|
|
\btwimg\.com/profile_images/[_\w./]*
|
|
# Twitter media
|
|
\btwimg\.com/media/[-_\w./?=]*
|
|
# Twitter link shortened
|
|
\bt\.co/\w+
|
|
|
|
# facebook
|
|
\bfburl\.com/[0-9a-z_]+
|
|
# facebook CDN
|
|
\bfbcdn\.net/[\w/.,]*
|
|
# facebook watch
|
|
\bfb\.watch/[0-9A-Za-z]+
|
|
|
|
# dropbox
|
|
\bdropbox\.com/sh?/[^/\s"]+/[-0-9A-Za-z_.%?=&;]+
|
|
|
|
# ipfs protocol
|
|
ipfs://[0-9a-z]*
|
|
# ipfs url
|
|
/ipfs/[0-9a-z]*
|
|
|
|
# w3
|
|
\bw3\.org/[-0-9a-zA-Z/#.]+
|
|
|
|
# loom
|
|
\bloom\.com/embed/[0-9a-f]+
|
|
|
|
# regex101
|
|
\bregex101\.com/r/[^/\s"]+/\d+
|
|
|
|
# figma
|
|
\bfigma\.com/file(?:/[0-9a-zA-Z]+/)+
|
|
|
|
# freecodecamp.org
|
|
\bfreecodecamp\.org/[-\w/.]+
|
|
|
|
# image.tmdb.org
|
|
\bimage\.tmdb\.org/[/\w.]+
|
|
|
|
# mermaid
|
|
\bmermaid\.ink/img/[-\w]+|\bmermaid-js\.github\.io/mermaid-live-editor/#/edit/[-\w]+
|
|
|
|
# Wikipedia
|
|
\ben\.wikipedia\.org/wiki/[-\w%.#]+
|
|
|
|
# gitweb
|
|
[^"\s]+/gitweb/\S+;h=[0-9a-f]+
|
|
|
|
# HyperKitty lists
|
|
/archives/list/[^@/]+\@[^/\s"]*/message/[^/\s"]*/
|
|
|
|
# lists
|
|
/thread\.html/[^"\s]+
|
|
|
|
# list-management
|
|
\blist-manage\.com/subscribe(?:[?&](?:u|id)=[0-9a-f]+)+
|
|
|
|
# kubectl.kubernetes.io/last-applied-configuration
|
|
"kubectl.kubernetes.io/last-applied-configuration": ".*"
|
|
|
|
# pgp
|
|
\bgnupg\.net/pks/lookup[?&=0-9a-zA-Z]*
|
|
|
|
# Spotify
|
|
\bopen\.spotify\.com/embed/playlist/\w+
|
|
|
|
# Mastodon
|
|
\bmastodon\.[-a-z.]*/(?:media/|\@)[?&=0-9a-zA-Z_]*
|
|
|
|
# scastie
|
|
\bscastie\.scala-lang\.org/[^/]+/\w+
|
|
|
|
# images.unsplash.com
|
|
\bimages\.unsplash\.com/(?:(?:flagged|reserve)/|)[-\w./%?=%&.;]+
|
|
|
|
# pastebin
|
|
\bpastebin\.com/[\w/]+
|
|
|
|
# heroku
|
|
\b\w+\.heroku\.com/source/archive/\w+
|
|
|
|
# quip
|
|
\b\w+\.quip\.com/\w+(?:(?:#|/issues/)\w+)?
|
|
|
|
# badgen.net
|
|
\bbadgen\.net/badge/[^")\]'\s]+
|
|
|
|
# statuspage.io
|
|
\w+\.statuspage\.io\b
|
|
|
|
# media.giphy.com
|
|
\bmedia\.giphy\.com/media/[^/]+/[\w.?&=]+
|
|
|
|
# tinyurl
|
|
\btinyurl\.com/\w+
|
|
|
|
# getopts
|
|
\bgetopts\s+(?:"[^"]+"|'[^']+')
|
|
|
|
# ANSI color codes
|
|
(?:\\(?:u00|x)1b|\x1b)\[\d+(?:;\d+|)m
|
|
|
|
# URL escaped characters
|
|
\%[0-9A-F][A-F]
|
|
# IPv6
|
|
\b(?:[0-9a-fA-F]{0,4}:){3,7}[0-9a-fA-F]{0,4}\b
|
|
# c99 hex digits (not the full format, just one I've seen)
|
|
0x[0-9a-fA-F](?:\.[0-9a-fA-F]*|)[pP]
|
|
# Punycode
|
|
\bxn--[-0-9a-z]+
|
|
# sha
|
|
sha\d+:[0-9]*[a-f]{3,}[0-9a-f]*
|
|
# sha-... -- uses a fancy capture
|
|
(['"]|")[0-9a-f]{40,}\g{-1}
|
|
# hex runs
|
|
\b[0-9a-fA-F]{16,}\b
|
|
# hex in url queries
|
|
=[0-9a-fA-F]*?(?:[A-F]{3,}|[a-f]{3,})[0-9a-fA-F]*?&
|
|
# ssh
|
|
(?:ssh-\S+|-nistp256) [-a-zA-Z=;:/0-9+]{12,}
|
|
|
|
# PGP
|
|
\b(?:[0-9A-F]{4} ){9}[0-9A-F]{4}\b
|
|
# GPG keys
|
|
\b(?:[0-9A-F]{4} ){5}(?: [0-9A-F]{4}){5}\b
|
|
# Well known gpg keys
|
|
.well-known/openpgpkey/[\w./]+
|
|
|
|
# uuid:
|
|
\b[0-9a-fA-F]{8}-(?:[0-9a-fA-F]{4}-){3}[0-9a-fA-F]{12}\b
|
|
# hex digits including css/html color classes:
|
|
(?:[\\0][xX]|\\u|[uU]\+|#x?|\%23)[0-9_a-fA-FgGrR]*?[a-fA-FgGrR]{2,}[0-9_a-fA-FgGrR]*(?:[uUlL]{0,3}|u\d+)\b
|
|
# integrity
|
|
integrity="sha\d+-[-a-zA-Z=;:/0-9+]{40,}"
|
|
|
|
# https://www.gnu.org/software/groff/manual/groff.html
|
|
# man troff content
|
|
\\f[BCIPR]
|
|
# ' (the troff apostrophe escape `\(aq`)
|
|
\\\(aq
|
|
|
|
# .desktop mime types
|
|
^MimeTypes?=.*$
|
|
# .desktop localized entries
|
|
^[A-Z][a-z]+\[[a-z]+\]=.*$
|
|
# Localized .desktop content
|
|
Name\[[^\]]+\]=.*
|
|
|
|
# IServiceProvider -- match the leading `I` before one or more CamelCase words
|
|
\bI(?=(?:[A-Z][a-z]{2,})+\b)
|
|
|
|
# crypt
|
|
"\$2[ayb]\$.{56}"
|
|
|
|
# scrypt / argon
|
|
\$(?:scrypt|argon\d+[di]*)\$\S+
|
|
|
|
# Input to GitHub JSON
|
|
content: "[-a-zA-Z=;:/0-9+]*="
|
|
|
|
# Python stringprefix / binaryprefix
|
|
# Note that there's a high false positive rate, remove the `?=` and search for the regex to see if the matches seem like reasonable strings
|
|
(?<!')\b(?:B|BR|Br|F|FR|Fr|R|RB|RF|Rb|Rf|U|UR|Ur|b|bR|br|f|fR|fr|r|rB|rF|rb|rf|u|uR|ur)'(?:[A-Z]{3,}|[A-Z][a-z]{2,}|[a-z]{3,})
|
|
|
|
# Regular expressions for (P|p)assword
|
|
\([A-Z]\|[a-z]\)[a-z]+
|
|
|
|
# JavaScript regular expressions
|
|
# javascript test regex
|
|
/.*/[gim]*\.test\(
|
|
# javascript match regex
|
|
\.match\(/[^/\s"]*/[gim]*\s*
|
|
# javascript match regex
|
|
\.match\(/\\[b].*?/[gim]*\s*\)(?:;|$)
|
|
# javascript regex
|
|
^\s*/\\[b].*/[gim]*\s*(?:\)(?:;|$)|,$)
|
|
# javascript replace regex
|
|
\.replace\(/[^/\s"]*/[gim]*\s*,
|
|
|
|
# Go regular expressions
|
|
regexp?\.MustCompile\(`[^`]*`\)
|
|
|
|
# sed regular expressions
|
|
sed 's/(?:[^/]*?[a-zA-Z]{3,}[^/]*?/){2}
|
|
|
|
# go install
|
|
go install(?:\s+[a-z]+\.[-@\w/.]+)+
|
|
|
|
# kubernetes pod status lists
|
|
# https://kubernetes.io/docs/concepts/workloads/pods/pod-lifecycle/#pod-phase
|
|
\w+(?:-\w+)+\s+\d+/\d+\s+(?:Running|Pending|Succeeded|Failed|Unknown)\s+
|
|
|
|
# kubectl - pods in CrashLoopBackOff
|
|
\w+-[0-9a-f]+-\w+\s+\d+/\d+\s+CrashLoopBackOff\s+
|
|
|
|
# kubernetes object suffix
|
|
-[0-9a-f]{10}-\w{5}\s
|
|
|
|
# posthog secrets
|
|
posthog\.init\((['"])phc_[^"',]+\g{-1},
|
|
|
|
# xcode
|
|
|
|
# xcodeproject scenes
|
|
(?:Controller|ID|id)="\w{3}-\w{2}-\w{3}"
|
|
|
|
# xcode api botches
|
|
customObjectInstantitationMethod
|
|
|
|
# font awesome classes
|
|
\.fa-[-a-z0-9]+
|
|
|
|
# Update Lorem based on your content (requires `ge` and `w` from https://github.com/jsoref/spelling; and `review` from https://github.com/check-spelling/check-spelling/wiki/Looking-for-items-locally )
|
|
# grep '^[^#].*lorem' .github/actions/spelling/patterns.txt|perl -pne 's/.*i..\?://;s/\).*//' |tr '|' "\n"|sort -f |xargs -n1 ge|perl -pne 's/^[^:]*://'|sort -u|w|sed -e 's/ .*//'|w|review -
|
|
# Warning, while `(?i)` is very neat and fancy, if you have some binary files that aren't proper unicode, you might run into:
|
|
## Operation "substitution (s///)" returns its argument for non-Unicode code point 0x1C19AE (the code point will vary).
|
|
## You could manually change `(?i)X...` to use `[Xx]...`
|
|
## or you could add the files to your `excludes` file (a version after 0.0.19 should identify the file path)
|
|
# Lorem
|
|
(?:\w|\s|[,.])*\b(?i)(?:amet|consectetur|cursus|dolor|eros|ipsum|lacus|libero|ligula|lorem|magna|neque|nulla|suscipit|tempus)\b(?:\w|\s|[,.])*
|
|
|
|
# Non-English
|
|
[a-zA-Z]*[ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝßàáâãäåæçèéêëìíîïðñòóôõöøùúûüýÿĀāŁłŃńŅņŒœŚśŠšŜŝŸŽžź][a-zA-Z]{3}[a-zA-ZÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝßàáâãäåæçèéêëìíîïðñòóôõöøùúûüýÿĀāŁłŃńŅņŒœŚśŠšŜŝŸŽžź]*
|
|
|
|
# French
|
|
# This corpus only had capital letters, but you probably want lowercase ones as well.
|
|
\b[LN]'+[a-z]{2,}\b
|
|
|
|
# latex
|
|
\\(?:n(?:ew|ormal|osub)|r(?:enew)|t(?:able(?:of|)|he|itle))(?=[a-z]+)
|
|
|
|
# the negative lookahead here is to allow catching 'templatesz' as a misspelling
|
|
# but to otherwise recognize a Windows path with \templates\foo.template or similar:
|
|
\\(?:necessary|r(?:eport|esolve[dr]?|esult)|t(?:arget|emplates?))(?![a-z])
|
|
# ignore long runs of a single character:
|
|
\b([A-Za-z])\g{-1}{3,}\b
|
|
# Note that the next example is no longer necessary if you are using
|
|
# to match a string starting with a `#`, use a character-class:
|
|
[#]backwards
|
|
# version suffix <word>v#
|
|
(?:(?<=[A-Z]{2})V|(?<=[a-z]{2}|[A-Z]{2})v)\d+(?:\b|(?=[a-zA-Z_]))
|
|
# Compiler flags (Scala)
|
|
(?:^|[\t ,>"'`=(])-J-[DPWXY](?=[A-Z]{2,}|[A-Z][a-z]|[a-z]{2,})
|
|
# Compiler flags
|
|
#(?:^|[\t ,"'`=(])-[DPWXYLlf](?=[A-Z]{2,}|[A-Z][a-z]|[a-z]{2,})
|
|
|
|
# Compiler flags (linker)
|
|
,-B
|
|
# curl arguments
|
|
\b(?:\\n|)curl(?:\s+-[a-zA-Z]{1,2}\b)*(?:\s+-[a-zA-Z]{3,})(?:\s+-[a-zA-Z]+)*
|
|
# set arguments
|
|
\bset(?:\s+-[abefimouxE]{1,2})*\s+-[abefimouxE]{3,}(?:\s+-[abefimouxE]+)*
|
|
# tar arguments
|
|
\b(?:\\n|)g?tar(?:\.exe|)(?:(?:\s+--[-a-zA-Z]+|\s+-[a-zA-Z]+|\s[ABGJMOPRSUWZacdfh-pr-xz]+\b)(?:=[^ ]*|))+
|
|
# tput arguments -- https://man7.org/linux/man-pages/man5/terminfo.5.html -- technically they can be more than 5 chars long...
|
|
\btput\s+(?:(?:-[SV]|-T\s*\w+)\s+)*\w{3,5}\b
|
|
# macOS temp folders
|
|
/var/folders/\w\w/[+\w]+/(?:T|-Caches-)/
|