Initial commit

clentfort · clentfort · commit de2b575a5642 · 2016-04-12T20:54:32.000+02:00
diff --git a/.babelrc b/.babelrc
@@ -0,0 +1,9 @@
+{
+  "presets": [ 
+    "es2015",
+    "stage-0"
+  ],
+  "plugins": [
+    "transform-flow-strip-types"
+  ]
+}
diff --git a/.eslintignore b/.eslintignore
@@ -0,0 +1 @@
+**/__tests__/
diff --git a/.eslintrc b/.eslintrc
@@ -0,0 +1,12 @@
+{
+  "extends": "airbnb/base",
+  "parser": "babel-eslint",
+  "plugins": [
+    "flowtype"
+  ],
+  "rules": {
+    "no-param-reassign": ["error", { "props": false }],
+    "no-use-before-define": "off",
+    "flowtype/space-before-type-colon": ["warn", "never"],
+  }
+}
diff --git a/.flowconfig b/.flowconfig
@@ -0,0 +1,7 @@
+[ignore]
+
+[include]
+
+[libs]
+
+[options]
diff --git a/.gitignore b/.gitignore
@@ -0,0 +1,7 @@
+node_modules/
+ENV
+
+# Elastic Beanstalk Files
+.elasticbeanstalk/*
+!.elasticbeanstalk/*.cfg.yml
+!.elasticbeanstalk/*.global.yml
diff --git a/package.json b/package.json
@@ -0,0 +1,49 @@
+{
+  "name": "another-selector-parser",
+  "version": "0.0.1",
+  "description": "",
+  "main": "index.js",
+  "scripts": {
+    "test": "NODE_ENV=test ./node_modules/.bin/jest"
+  },
+  "repository": {
+    "type": "git",
+    "url": "clentfort/another-selector-parser.git"
+  },
+  "keywords": [
+    "css",
+    "selector",
+    "parser"
+  ],
+  "author": "Christian Lentfort @_chris_lent_",
+  "license": "MIT",
+  "devDependencies": {
+    "babel": "^6.5.2",
+    "babel-jest": "^10.0.2",
+    "babel-plugin-transform-flow-strip-types": "^6.7.0",
+    "babel-polyfill": "^6.7.4",
+    "babel-preset-es2015": "^6.6.0",
+    "babel-preset-stage-0": "^6.5.0",
+    "eslint": "^2.7.0",
+    "eslint-config-airbnb": "^6.2.0",
+    "eslint-plugin-flowtype": "^2.2.6",
+    "jest-cli": "^0.10.2"
+  },
+  "jest": {
+    "scriptPreprocessor": "<rootDir>/node_modules/babel-jest",
+    "testFileExtensions": [
+      "js"
+    ],
+    "moduleFileExtensions": [
+      "js",
+      "json"
+    ]
+  }
+}
diff --git a/src/tokenizer/__tests__/index.js b/src/tokenizer/__tests__/index.js
@@ -0,0 +1,25 @@
+jest.unmock('../');
+jest.unmock('../types');
+
+import tokenize from '../';
+import { types as tt } from '../types';
+
+describe('tokenize', () => {
+  it('returns EOF for empty input', () => {
+    const { value, done } = tokenize('').next();
+    expect(done).toBe(true);
+    expect(value).toEqual({ type: tt.eof });
+  });
+
+  it('is down after returning EOF', () => {
+    const tokenizer = tokenize('');
+    tokenizer.next();
+    expect(tokenizer.next().done).toBe(true);
+  });
+
+  it('ignores any comments', () => {
+    let { value, done } = tokenize('/*abc*/').next();
+    expect(done).toBe(true);
+    expect(value).toEqual({ type: tt.eof });
+  });
+});
diff --git a/src/tokenizer/index.js b/src/tokenizer/index.js
@@ -0,0 +1,203 @@
+/* @flow */
+import { types as tt } from './types';
+
+import type { TokenType } from './types';
+
+type Token = {
+  type: TokenType;
+  value?: any;
+};
+
+export default function *tokenize(input: string): Generator<Token, Token, void> {
+  // Current position in the input string
+  let position = 0;
+
+  while (position < input.length) {
+    // Current char we are looking at
+    let currentChar = input[position];
+
+    let wasWhitespace = false;
+    if (isWhitespace(currentChar)) {
+      currentChar = input[++position];
+      while (isWhitespace(currentChar)) {
+        currentChar = input[++position];
+      }
+      yield { type: tt.whitespace };
+      // No continue needed here since we consumed all whitespace and a guaranteed to find something meaningful now
+    }
+
+    if (currentChar === '/') {
+      currentChar = input[++position];
+      if (currentChar === '*') {
+        // Inside a comment
+        console.log('Inside a comment');
+        currentChar = input[++position];
+        let nextChar = input[position + 1];
+        console.log('Current Char', currentChar);
+        console.log('Next Char', nextChar);
+        console.log('Start while');
+        while (!(currentChar === '*' && nextChar === '/')) {
+          currentChar = input[++position];
+          nextChar = input[position + 1];
+          console.log('Current Char', currentChar);
+          console.log('Next Char', nextChar);
+        }
+        console.log('End while');
+        currentChar = input[position + 2];
+        position += 2;
+        console.log('Current Char', currentChar);
+      } else {
+        throw new UnexpectedCharacterError('/', currentChar);
+      }
+    }
+
+    if (currentChar === '[') {
+      yield { type: tt.bracketL };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === ']') {
+      yield { type: tt.bracketR };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === ':') {
+      yield { type: tt.colon };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === ',') {
+      yield { type: tt.comma };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === '.') {
+      yield { type: tt.dot };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === '>') {
+      yield { type: tt.greater };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === '#') {
+      yield { type: tt.hash };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === '(') {
+      yield { type: tt.parenL };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === ')') {
+      yield { type: tt.parenR };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === '%') {
+      yield { type: tt.percentage };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === '+') {
+      yield { type: tt.plus };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === '~') {
+      yield { type: tt.tilde };
+      ++position;
+      continue;
+    }
+
+    if (currentChar === '|') {
+      currentChar= input[++position];
+      if (currentChar === '=') {
+        yield { type: tt.dashmatch };
+        ++position;
+        continue;
+      } else {
+        throw new UnexpectedCharacterError(currentChar, '=');
+      }
+    }
+
+    if (currentChar === '~') {
+      currentChar= input[++position];
+      if (currentChar === '=') {
+        yield { type: tt.includes };
+        ++position;
+        continue;
+      } else {
+        throw new UnexpectedCharacterError(currentChar, '=');
+      }
+    }
+
+    if (currentChar === '^') {
+      currentChar= input[++position];
+      if (currentChar === '=') {
+        yield { type: tt.prefixmatch };
+        ++position;
+        continue;
+      } else {
+        throw new UnexpectedCharacterError(currentChar, '=');
+      }
+    }
+
+    if (currentChar === '*') {
+      currentChar= input[++position];
+      if (currentChar === '=') {
+        yield { type: tt.substringmatch };
+        ++position;
+        continue;
+      } else {
+        throw new UnexpectedCharacterError(currentChar, '=');
+      }
+    }
+
+    if (currentChar === '$') {
+      currentChar= input[++position];
+      if (currentChar === '=') {
+        yield { type: tt.suffixmatch };
+        ++position;
+        continue;
+      } else {
+        throw new UnexpectedCharacterError(currentChar, '=');
+      }
+    }
+
+  }
+
+  return {
+    type: tt.eof,
+  };
+}
+
+function isWhitespace(char: string) {
+  return (char === ' ' || char === "\t" || char === "\r" || char === "\n" || char === "\f");
+}
+
+
+class UnexpectedCharacterError extends Error {
+  constructor(actual, expected) {
+    super(`Unexpected char "${actual}", expected "${expected}".`);
+  }
+}
+
+class UnexpectedEofError extends Error {
+  constructor(expected) {
+    super(`Unexpected end of input, expected "${expected}".`);
+  }
+}
diff --git a/src/tokenizer/types.js b/src/tokenizer/types.js
@@ -0,0 +1,33 @@
+/* @flow */
+/**
+ * Describes one kind of token by a human-readable label.
+ */
+export class TokenType {
+  // Text identifying this kind of token, e.g. the literal symbol or a name such as 'ident'.
+  label: string;
+
+  constructor(label: string) {
+    this.label = label;
+  }
+}
+
+/**
+ * The token types known to the tokenizer, one shared TokenType instance per kind.
+ * Symbol tokens are labelled with their literal text; the remaining ones with a name.
+ */
+export const types = {
+  bracketL: new TokenType('['),
+  bracketR: new TokenType(']'),
+  colon: new TokenType(':'),
+  comma: new TokenType(','),
+  dashmatch: new TokenType('|='),
+  dot: new TokenType('.'),
+  greater: new TokenType('>'),
+  hash: new TokenType('#'),
+  ident: new TokenType('ident'),
+  includes: new TokenType('~='),
+  num: new TokenType('num'),
+  parenL: new TokenType('('),
+  parenR: new TokenType(')'),
+  percentage: new TokenType('%'),
+  plus: new TokenType('+'),
+  prefixmatch: new TokenType('^='),
+  string: new TokenType('string'),
+  substringmatch: new TokenType('*='),
+  suffixmatch: new TokenType('$='),
+  tilde: new TokenType('~'),
+  whitespace: new TokenType('whitespace'),
+  // Marks the end of the input.
+  eof: new TokenType('EOF'),
+};