diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASS.g4 b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASS.g4
new file mode 100644
index 00000000000..6fc4b8c1465
--- /dev/null
+++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASS.g4
@@ -0,0 +1,318 @@
+grammar CASS;
+
+// NOTE: CASS.interp, CASSLexer.interp and CASS.tokens are generated from this
+// grammar. Regenerate them with the ANTLR tool after changing any rule.
+
+// --------------------------
+// 1) Top-Level Structure
+// --------------------------
+
+// Entry point: one or more statements (which include function definitions
+// and include directives) followed by end of input.
+prog
+    : statement+ EOF
+    ;
+
+// Return type, name, optional parameter list and a braced body. The name is
+// matched by primaryExpression, so the parser does not limit it to an ID.
+functionDefinition
+    : typeSpec primaryExpression '(' parameterList? ')' compoundStatement
+    ;
+
+// A block of statements in braces.
+compoundStatement
+    : '{' statement* '}'
+    ;
+
+// --------------------------
+// 2) Declarations & Statements
+// --------------------------
+
+// Every construct allowed at top level and inside a block.
+statement
+    : declarationStatement
+    | forBlockStatement
+    | forSingleStatement
+    | whileBlockStatement
+    | whileSingleStatement
+    | ifBlockStatement
+    | ifSingleStatement
+    | returnStatement
+    | switchStatement
+    | caseStatement
+    | expressionStatement
+    | functionDefinition
+    | includeStatement
+    ;
+
+// Scalar, pointer or array declaration with an optional initializer.
+// Alternatives use a single '|': ANTLR reads '||' as two bars around an EMPTY
+// alternative, which would make the declarator and the initializer value
+// optional ("int = ;" would parse). The trailing ';' is optional because the
+// for-statement rules embed this rule and match the ';' themselves.
+declarationStatement
+    : typeSpec POINTER* (primaryExpression | arrayDeclarator)
+      ('=' (expression | nullptr | emptyInitializer))? ';'?
+    ;
+
+// for-loop with a braced body. The init clause is explicitly optional so
+// that "for (; cond; step)" is accepted.
+forBlockStatement
+    : 'for' '(' (declarationStatement | assignmentExpression)? ';'
+      logicalOrExpression ';' unaryExpression ')' compoundStatement
+    ;
+
+// for-loop whose body is a single statement; same header as above.
+forSingleStatement
+    : 'for' '(' (declarationStatement | assignmentExpression)? ';'
+      logicalOrExpression ';' unaryExpression ')' statement
+    ;
+
+// Condition shared by if, while and switch.
+conditionClause
+    : logicalOrExpression
+    ;
+
+whileBlockStatement
+    : 'while' '(' conditionClause ')' compoundStatement
+    ;
+
+whileSingleStatement
+    : 'while' '(' conditionClause ')' statement
+    ;
+
+ifBlockStatement
+    : 'if' '(' conditionClause ')' compoundStatement elseClause?
+    ;
+
+ifSingleStatement
+    : 'if' '(' conditionClause ')' statement elseClause?
+    ;
+
+elseClause
+    : 'else' (compoundStatement | ifBlockStatement | statement)
+    ;
+
+switchStatement
+    : 'switch' '(' conditionClause ')' compoundStatement
+    ;
+
+// A "case <value>:" or "default:" label, the statements under it and an
+// optional closing "break;".
+caseStatement
+    : ('case' | defaultExpression) primaryExpression? ':' statement* breakExpression?
+    ;
+
+functionCall
+    : ID '(' argumentList? ')'
+    ;
+
+arrayDeclarator
+    : primaryExpression '[' primaryExpression? ']'
+    ;
+
+listInitializer
+    : '{' primaryExpression (',' primaryExpression)* '}'
+    ;
+
+emptyInitializer
+    : '{' '}'
+    ;
+
+nullptr
+    : 'nullptr'
+    ;
+
+argumentList
+    : expression (',' expression)*
+    ;
+
+returnStatement
+    : 'return' expression? ';'
+    ;
+
+expressionStatement
+    : expression ';'
+    ;
+
+// Matches the keyword 'include' followed by a string literal.
+includeStatement
+    : 'include' STRING
+    ;
+
+// --------------------------
+// 3) Parameters & Types
+// --------------------------
+
+parameterList
+    : parameter (',' parameter)*
+    ;
+
+parameter
+    : typeSpec primaryExpression
+    ;
+
+typeSpec
+    : 'int'
+    | 'float'
+    | 'double'
+    | 'void'
+    ;
+
+// --------------------------
+// 4) Expressions
+// --------------------------
+
+// For simplicity, "expression" wraps the typical C operator precedences.
+expression
+    : assignmentExpression
+    | functionCall
+    ;
+
+defaultExpression
+    : 'default'
+    ;
+
+breakExpression
+    : 'break' ';'
+    ;
+
+// Assignment, recursing on the right-hand side. 'nullptr' and '{}' are
+// alternatives for the right-hand side rather than trailers after it, so
+// that "p = nullptr" and "v = {}" parse.
+assignmentExpression
+    : unaryExpression assignmentOperator
+      (assignmentExpression | nullptr | emptyInitializer)
+    | logicalOrExpression
+    ;
+
+unaryExpression
+    : ('++' | '--') unaryExpression
+    | unaryExpression ('++' | '--')
+    | pointerExpression
+    | primaryExpression
+    | listInitializer
+    ;
+
+// NOTE(review): not referenced by any other rule in this grammar.
+comparingExpression
+    : '>'
+    | '<'
+    | '<='
+    | '>='
+    ;
+
+primaryExpression
+    : ID
+    | INT
+    | FLOAT
+    | CHAR
+    | STRING
+    | BOOL
+    | functionCall
+    | '(' expression ')'
+    ;
+
+pointerExpression
+    : '&' primaryExpression
+    | '*' primaryExpression
+    ;
+
+assignmentOperator
+    : '='
+    | '+='
+    | '-='
+    | '*='
+    | '/='
+    ;
+
+logicalOrExpression
+    : logicalAndExpression ('||' logicalAndExpression)*
+    ;
+
+logicalAndExpression
+    : equalityExpression ('&&' equalityExpression)*
+    ;
+
+equalityExpression
+    : relationalExpression (( '==' | '!=' ) relationalExpression)*
+    ;
+
+relationalExpression
+    : additiveExpression (( '<' | '>' | '<=' | '>=' ) additiveExpression)*
+    ;
+
+additiveExpression
+    : multiplicativeExpression (( '+' | '-' ) multiplicativeExpression)*
+    ;
+
+multiplicativeExpression
+    : unaryExpression (( '*' | '/' | '%' ) unaryExpression)*
+    ;
+
+// NOTE(review): not referenced by any other rule in this grammar.
+operationExpression
+    : additiveExpression         // Handles '+' and '-' precedence
+    | multiplicativeExpression   // Handles '*' and '/'
+    ;
+
+// --------------------------
+// 5) Lexer Rules
+// --------------------------
+
+SL_COMMENT
+    : '//' ~[\r\n]* -> skip
+    ;
+
+ML_COMMENT
+    : '/*' .*? '*/' -> skip
+    ;
+
+// BOOL precedes ID on purpose: when two lexer rules match the same text,
+// ANTLR picks the rule defined first, so after ID it could never match.
+BOOL
+    : 'true'
+    | 'false'
+    ;
+
+ID
+    : [a-zA-Z_] [a-zA-Z0-9_]*
+    ;
+
+// NOTE(review): the sign is part of the token, so "a-1" lexes as ID INT and
+// cannot parse as a subtraction. Moving the sign into a unary-minus parser
+// rule would change the parse-tree shape, so it is only flagged here.
+INT
+    : '-'? [0-9]+
+    ;
+
+FLOAT
+    : [0-9]+ '.' [0-9]+ ([eE] [+-]? [0-9]+)?
+    | '.' [0-9]+ ([eE] [+-]? [0-9]+)?
+    | [0-9]+ ([eE] [+-]? [0-9]+)
+    ;
+
+// Character literal in single quotes: one escape sequence, or one character
+// that is not a quote, backslash or line break.
+CHAR
+    : '\'' (ESC_SEQ | ~['\\\r\n]) '\''
+    ;
+
+POINTER
+    : '*'
+    ;
+
+// String literal in double quotes, with backslash escapes.
+STRING
+    : '"' (ESC_SEQ | ~["\\])* '"'
+    ;
+
+// Backslash followed by one of: b t n f r " ' \
+fragment ESC_SEQ
+    : '\\' [btnfr"'\\]
+    ;
+
+// Skip whitespace and newlines
+WS
+    : [ \t\r\n]+ -> skip
+    ;
diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASS.interp b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASS.interp
new file mode 100644
index 00000000000..69658b30c9b
--- /dev/null
+++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASS.interp
@@ -0,0 +1,162 @@
+token literal names:
+null
+'('
+')'
+'{'
+'}'
+'='
+';'
+'for'
+'while'
+'if'
+'else'
+'switch'
+'case'
+':'
+'['
+']'
+','
+'nullptr'
+'return'
+'include'
+'int'
+'float'
+'double'
+'void'
+'default'
+'break'
+'++'
+'--'
+'>'
+'<'
+'<='
+'>='
+'&'
+'+='
+'-='
+'*='
+'/='
+'||'
+'&&'
+'=='
+'!='
+'+'
+'-'
+'/'
+'%'
+null
+null
+null
+null
+null
+null
+null
+'*'
+null
+null
+
+token symbolic names:
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+null
+SL_COMMENT
+ML_COMMENT
+ID
+INT
+BOOL
+FLOAT
+CHAR
+POINTER
+STRING
+WS
+
+rule names:
+prog
+functionDefinition
+compoundStatement
+statement
+declarationStatement
+forBlockStatement
+forSingleStatement
+conditionClause
+whileBlockStatement
+whileSingleStatement
+ifBlockStatement
+ifSingleStatement
+elseClause
+switchStatement
+caseStatement
+functionCall
+arrayDeclarator
+listInitializer
+emptyInitializer
+nullptr
+argumentList
+returnStatement
+expressionStatement
+includeStatement
+parameterList
+parameter
+typeSpec
+expression
+defaultExpression
+breakExpression
+assignmentExpression
+unaryExpression
+comparingExpression
+primaryExpression
+pointerExpression
+assignmentOperator
+logicalOrExpression
+logicalAndExpression
+equalityExpression
+relationalExpression
+additiveExpression
+multiplicativeExpression
+operationExpression
+
+
+atn:
+[4, 1, 54, 415, 2, 0, 7, 0, 2, 1,
7, 1, 2, 2, 7, 2, 2, 3, 7, 3, 2, 4, 7, 4, 2, 5, 7, 5, 2, 6, 7, 6, 2, 7, 7, 7, 2, 8, 7, 8, 2, 9, 7, 9, 2, 10, 7, 10, 2, 11, 7, 11, 2, 12, 7, 12, 2, 13, 7, 13, 2, 14, 7, 14, 2, 15, 7, 15, 2, 16, 7, 16, 2, 17, 7, 17, 2, 18, 7, 18, 2, 19, 7, 19, 2, 20, 7, 20, 2, 21, 7, 21, 2, 22, 7, 22, 2, 23, 7, 23, 2, 24, 7, 24, 2, 25, 7, 25, 2, 26, 7, 26, 2, 27, 7, 27, 2, 28, 7, 28, 2, 29, 7, 29, 2, 30, 7, 30, 2, 31, 7, 31, 2, 32, 7, 32, 2, 33, 7, 33, 2, 34, 7, 34, 2, 35, 7, 35, 2, 36, 7, 36, 2, 37, 7, 37, 2, 38, 7, 38, 2, 39, 7, 39, 2, 40, 7, 40, 2, 41, 7, 41, 2, 42, 7, 42, 1, 0, 4, 0, 88, 8, 0, 11, 0, 12, 0, 89, 1, 0, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 98, 8, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 2, 5, 2, 105, 8, 2, 10, 2, 12, 2, 108, 9, 2, 1, 2, 1, 2, 1, 3, 1, 3, 1, 3, 1, 3, 1, 3, 1, 3, 1, 3, 1, 3, 1, 3, 1, 3, 1, 3, 1, 3, 1, 3, 3, 3, 125, 8, 3, 1, 4, 1, 4, 5, 4, 129, 8, 4, 10, 4, 12, 4, 132, 9, 4, 1, 4, 1, 4, 1, 4, 3, 4, 137, 8, 4, 1, 4, 1, 4, 1, 4, 1, 4, 1, 4, 1, 4, 3, 4, 145, 8, 4, 3, 4, 147, 8, 4, 1, 4, 3, 4, 150, 8, 4, 1, 5, 1, 5, 1, 5, 1, 5, 1, 5, 3, 5, 157, 8, 5, 1, 5, 1, 5, 1, 5, 1, 5, 1, 5, 1, 5, 1, 5, 1, 6, 1, 6, 1, 6, 3, 6, 169, 8, 6, 1, 6, 1, 6, 3, 6, 173, 8, 6, 1, 6, 1, 6, 1, 6, 1, 6, 1, 6, 1, 6, 1, 6, 1, 7, 1, 7, 1, 8, 1, 8, 1, 8, 1, 8, 1, 8, 1, 8, 1, 9, 1, 9, 1, 9, 1, 9, 1, 9, 1, 9, 1, 10, 1, 10, 1, 10, 1, 10, 1, 10, 1, 10, 3, 10, 202, 8, 10, 1, 11, 1, 11, 1, 11, 1, 11, 1, 11, 1, 11, 3, 11, 210, 8, 11, 1, 12, 1, 12, 1, 12, 1, 12, 3, 12, 216, 8, 12, 1, 13, 1, 13, 1, 13, 1, 13, 1, 13, 1, 13, 1, 14, 1, 14, 3, 14, 226, 8, 14, 1, 14, 3, 14, 229, 8, 14, 1, 14, 1, 14, 5, 14, 233, 8, 14, 10, 14, 12, 14, 236, 9, 14, 1, 14, 3, 14, 239, 8, 14, 1, 15, 1, 15, 1, 15, 3, 15, 244, 8, 15, 1, 15, 1, 15, 1, 16, 1, 16, 1, 16, 3, 16, 251, 8, 16, 1, 16, 1, 16, 1, 17, 1, 17, 1, 17, 1, 17, 5, 17, 259, 8, 17, 10, 17, 12, 17, 262, 9, 17, 1, 17, 1, 17, 1, 18, 1, 18, 1, 18, 1, 19, 1, 19, 1, 20, 1, 20, 1, 20, 5, 20, 274, 8, 20, 10, 20, 12, 20, 277, 9, 20, 1, 21, 1, 21, 3, 21, 281, 8, 21, 1, 21, 1, 21, 
1, 22, 1, 22, 1, 22, 1, 23, 1, 23, 1, 23, 1, 24, 1, 24, 1, 24, 5, 24, 294, 8, 24, 10, 24, 12, 24, 297, 9, 24, 1, 25, 1, 25, 1, 25, 1, 26, 1, 26, 1, 27, 1, 27, 3, 27, 306, 8, 27, 1, 28, 1, 28, 1, 29, 1, 29, 1, 29, 1, 30, 1, 30, 1, 30, 1, 30, 3, 30, 317, 8, 30, 1, 30, 3, 30, 320, 8, 30, 1, 30, 3, 30, 323, 8, 30, 1, 31, 1, 31, 1, 31, 1, 31, 1, 31, 1, 31, 3, 31, 331, 8, 31, 1, 31, 1, 31, 5, 31, 335, 8, 31, 10, 31, 12, 31, 338, 9, 31, 1, 32, 1, 32, 1, 33, 1, 33, 1, 33, 1, 33, 1, 33, 1, 33, 1, 33, 1, 33, 1, 33, 1, 33, 1, 33, 3, 33, 353, 8, 33, 1, 34, 1, 34, 1, 34, 1, 34, 3, 34, 359, 8, 34, 1, 35, 1, 35, 1, 36, 1, 36, 1, 36, 5, 36, 366, 8, 36, 10, 36, 12, 36, 369, 9, 36, 1, 37, 1, 37, 1, 37, 5, 37, 374, 8, 37, 10, 37, 12, 37, 377, 9, 37, 1, 38, 1, 38, 1, 38, 5, 38, 382, 8, 38, 10, 38, 12, 38, 385, 9, 38, 1, 39, 1, 39, 1, 39, 5, 39, 390, 8, 39, 10, 39, 12, 39, 393, 9, 39, 1, 40, 1, 40, 1, 40, 5, 40, 398, 8, 40, 10, 40, 12, 40, 401, 9, 40, 1, 41, 1, 41, 1, 41, 5, 41, 406, 8, 41, 10, 41, 12, 41, 409, 9, 41, 1, 42, 1, 42, 3, 42, 413, 8, 42, 1, 42, 0, 1, 62, 43, 0, 2, 4, 6, 8, 10, 12, 14, 16, 18, 20, 22, 24, 26, 28, 30, 32, 34, 36, 38, 40, 42, 44, 46, 48, 50, 52, 54, 56, 58, 60, 62, 64, 66, 68, 70, 72, 74, 76, 78, 80, 82, 84, 0, 7, 1, 0, 20, 23, 1, 0, 26, 27, 1, 0, 28, 31, 2, 0, 5, 5, 33, 36, 1, 0, 39, 40, 1, 0, 41, 42, 2, 0, 43, 44, 52, 52, 437, 0, 87, 1, 0, 0, 0, 2, 93, 1, 0, 0, 0, 4, 102, 1, 0, 0, 0, 6, 124, 1, 0, 0, 0, 8, 126, 1, 0, 0, 0, 10, 151, 1, 0, 0, 0, 12, 165, 1, 0, 0, 0, 14, 181, 1, 0, 0, 0, 16, 183, 1, 0, 0, 0, 18, 189, 1, 0, 0, 0, 20, 195, 1, 0, 0, 0, 22, 203, 1, 0, 0, 0, 24, 211, 1, 0, 0, 0, 26, 217, 1, 0, 0, 0, 28, 225, 1, 0, 0, 0, 30, 240, 1, 0, 0, 0, 32, 247, 1, 0, 0, 0, 34, 254, 1, 0, 0, 0, 36, 265, 1, 0, 0, 0, 38, 268, 1, 0, 0, 0, 40, 270, 1, 0, 0, 0, 42, 278, 1, 0, 0, 0, 44, 284, 1, 0, 0, 0, 46, 287, 1, 0, 0, 0, 48, 290, 1, 0, 0, 0, 50, 298, 1, 0, 0, 0, 52, 301, 1, 0, 0, 0, 54, 305, 1, 0, 0, 0, 56, 307, 1, 0, 0, 0, 58, 309, 1, 0, 0, 0, 60, 322, 1, 0, 0, 
0, 62, 330, 1, 0, 0, 0, 64, 339, 1, 0, 0, 0, 66, 352, 1, 0, 0, 0, 68, 358, 1, 0, 0, 0, 70, 360, 1, 0, 0, 0, 72, 362, 1, 0, 0, 0, 74, 370, 1, 0, 0, 0, 76, 378, 1, 0, 0, 0, 78, 386, 1, 0, 0, 0, 80, 394, 1, 0, 0, 0, 82, 402, 1, 0, 0, 0, 84, 412, 1, 0, 0, 0, 86, 88, 3, 6, 3, 0, 87, 86, 1, 0, 0, 0, 88, 89, 1, 0, 0, 0, 89, 87, 1, 0, 0, 0, 89, 90, 1, 0, 0, 0, 90, 91, 1, 0, 0, 0, 91, 92, 5, 0, 0, 1, 92, 1, 1, 0, 0, 0, 93, 94, 3, 52, 26, 0, 94, 95, 3, 66, 33, 0, 95, 97, 5, 1, 0, 0, 96, 98, 3, 48, 24, 0, 97, 96, 1, 0, 0, 0, 97, 98, 1, 0, 0, 0, 98, 99, 1, 0, 0, 0, 99, 100, 5, 2, 0, 0, 100, 101, 3, 4, 2, 0, 101, 3, 1, 0, 0, 0, 102, 106, 5, 3, 0, 0, 103, 105, 3, 6, 3, 0, 104, 103, 1, 0, 0, 0, 105, 108, 1, 0, 0, 0, 106, 104, 1, 0, 0, 0, 106, 107, 1, 0, 0, 0, 107, 109, 1, 0, 0, 0, 108, 106, 1, 0, 0, 0, 109, 110, 5, 4, 0, 0, 110, 5, 1, 0, 0, 0, 111, 125, 3, 8, 4, 0, 112, 125, 3, 10, 5, 0, 113, 125, 3, 12, 6, 0, 114, 125, 3, 16, 8, 0, 115, 125, 3, 18, 9, 0, 116, 125, 3, 20, 10, 0, 117, 125, 3, 22, 11, 0, 118, 125, 3, 42, 21, 0, 119, 125, 3, 26, 13, 0, 120, 125, 3, 28, 14, 0, 121, 125, 3, 44, 22, 0, 122, 125, 3, 2, 1, 0, 123, 125, 3, 46, 23, 0, 124, 111, 1, 0, 0, 0, 124, 112, 1, 0, 0, 0, 124, 113, 1, 0, 0, 0, 124, 114, 1, 0, 0, 0, 124, 115, 1, 0, 0, 0, 124, 116, 1, 0, 0, 0, 124, 117, 1, 0, 0, 0, 124, 118, 1, 0, 0, 0, 124, 119, 1, 0, 0, 0, 124, 120, 1, 0, 0, 0, 124, 121, 1, 0, 0, 0, 124, 122, 1, 0, 0, 0, 124, 123, 1, 0, 0, 0, 125, 7, 1, 0, 0, 0, 126, 130, 3, 52, 26, 0, 127, 129, 5, 52, 0, 0, 128, 127, 1, 0, 0, 0, 129, 132, 1, 0, 0, 0, 130, 128, 1, 0, 0, 0, 130, 131, 1, 0, 0, 0, 131, 136, 1, 0, 0, 0, 132, 130, 1, 0, 0, 0, 133, 137, 3, 66, 33, 0, 134, 137, 1, 0, 0, 0, 135, 137, 3, 32, 16, 0, 136, 133, 1, 0, 0, 0, 136, 134, 1, 0, 0, 0, 136, 135, 1, 0, 0, 0, 137, 146, 1, 0, 0, 0, 138, 144, 5, 5, 0, 0, 139, 145, 3, 54, 27, 0, 140, 145, 1, 0, 0, 0, 141, 145, 3, 38, 19, 0, 142, 145, 1, 0, 0, 0, 143, 145, 3, 36, 18, 0, 144, 139, 1, 0, 0, 0, 144, 140, 1, 0, 0, 0, 144, 141, 1, 0, 0, 0, 144, 
142, 1, 0, 0, 0, 144, 143, 1, 0, 0, 0, 145, 147, 1, 0, 0, 0, 146, 138, 1, 0, 0, 0, 146, 147, 1, 0, 0, 0, 147, 149, 1, 0, 0, 0, 148, 150, 5, 6, 0, 0, 149, 148, 1, 0, 0, 0, 149, 150, 1, 0, 0, 0, 150, 9, 1, 0, 0, 0, 151, 152, 5, 7, 0, 0, 152, 156, 5, 1, 0, 0, 153, 157, 3, 8, 4, 0, 154, 157, 1, 0, 0, 0, 155, 157, 3, 60, 30, 0, 156, 153, 1, 0, 0, 0, 156, 154, 1, 0, 0, 0, 156, 155, 1, 0, 0, 0, 157, 158, 1, 0, 0, 0, 158, 159, 5, 6, 0, 0, 159, 160, 3, 72, 36, 0, 160, 161, 5, 6, 0, 0, 161, 162, 3, 62, 31, 0, 162, 163, 5, 2, 0, 0, 163, 164, 3, 4, 2, 0, 164, 11, 1, 0, 0, 0, 165, 166, 5, 7, 0, 0, 166, 172, 5, 1, 0, 0, 167, 169, 3, 8, 4, 0, 168, 167, 1, 0, 0, 0, 168, 169, 1, 0, 0, 0, 169, 173, 1, 0, 0, 0, 170, 173, 1, 0, 0, 0, 171, 173, 3, 60, 30, 0, 172, 168, 1, 0, 0, 0, 172, 170, 1, 0, 0, 0, 172, 171, 1, 0, 0, 0, 173, 174, 1, 0, 0, 0, 174, 175, 5, 6, 0, 0, 175, 176, 3, 72, 36, 0, 176, 177, 5, 6, 0, 0, 177, 178, 3, 62, 31, 0, 178, 179, 5, 2, 0, 0, 179, 180, 3, 6, 3, 0, 180, 13, 1, 0, 0, 0, 181, 182, 3, 72, 36, 0, 182, 15, 1, 0, 0, 0, 183, 184, 5, 8, 0, 0, 184, 185, 5, 1, 0, 0, 185, 186, 3, 14, 7, 0, 186, 187, 5, 2, 0, 0, 187, 188, 3, 4, 2, 0, 188, 17, 1, 0, 0, 0, 189, 190, 5, 8, 0, 0, 190, 191, 5, 1, 0, 0, 191, 192, 3, 14, 7, 0, 192, 193, 5, 2, 0, 0, 193, 194, 3, 6, 3, 0, 194, 19, 1, 0, 0, 0, 195, 196, 5, 9, 0, 0, 196, 197, 5, 1, 0, 0, 197, 198, 3, 14, 7, 0, 198, 199, 5, 2, 0, 0, 199, 201, 3, 4, 2, 0, 200, 202, 3, 24, 12, 0, 201, 200, 1, 0, 0, 0, 201, 202, 1, 0, 0, 0, 202, 21, 1, 0, 0, 0, 203, 204, 5, 9, 0, 0, 204, 205, 5, 1, 0, 0, 205, 206, 3, 14, 7, 0, 206, 207, 5, 2, 0, 0, 207, 209, 3, 6, 3, 0, 208, 210, 3, 24, 12, 0, 209, 208, 1, 0, 0, 0, 209, 210, 1, 0, 0, 0, 210, 23, 1, 0, 0, 0, 211, 215, 5, 10, 0, 0, 212, 216, 3, 4, 2, 0, 213, 216, 3, 20, 10, 0, 214, 216, 3, 6, 3, 0, 215, 212, 1, 0, 0, 0, 215, 213, 1, 0, 0, 0, 215, 214, 1, 0, 0, 0, 216, 25, 1, 0, 0, 0, 217, 218, 5, 11, 0, 0, 218, 219, 5, 1, 0, 0, 219, 220, 3, 14, 7, 0, 220, 221, 5, 2, 0, 0, 221, 222, 3, 4, 2, 0, 222, 
27, 1, 0, 0, 0, 223, 226, 5, 12, 0, 0, 224, 226, 3, 56, 28, 0, 225, 223, 1, 0, 0, 0, 225, 224, 1, 0, 0, 0, 226, 228, 1, 0, 0, 0, 227, 229, 3, 66, 33, 0, 228, 227, 1, 0, 0, 0, 228, 229, 1, 0, 0, 0, 229, 230, 1, 0, 0, 0, 230, 234, 5, 13, 0, 0, 231, 233, 3, 6, 3, 0, 232, 231, 1, 0, 0, 0, 233, 236, 1, 0, 0, 0, 234, 232, 1, 0, 0, 0, 234, 235, 1, 0, 0, 0, 235, 238, 1, 0, 0, 0, 236, 234, 1, 0, 0, 0, 237, 239, 3, 58, 29, 0, 238, 237, 1, 0, 0, 0, 238, 239, 1, 0, 0, 0, 239, 29, 1, 0, 0, 0, 240, 241, 5, 47, 0, 0, 241, 243, 5, 1, 0, 0, 242, 244, 3, 40, 20, 0, 243, 242, 1, 0, 0, 0, 243, 244, 1, 0, 0, 0, 244, 245, 1, 0, 0, 0, 245, 246, 5, 2, 0, 0, 246, 31, 1, 0, 0, 0, 247, 248, 3, 66, 33, 0, 248, 250, 5, 14, 0, 0, 249, 251, 3, 66, 33, 0, 250, 249, 1, 0, 0, 0, 250, 251, 1, 0, 0, 0, 251, 252, 1, 0, 0, 0, 252, 253, 5, 15, 0, 0, 253, 33, 1, 0, 0, 0, 254, 255, 5, 3, 0, 0, 255, 260, 3, 66, 33, 0, 256, 257, 5, 16, 0, 0, 257, 259, 3, 66, 33, 0, 258, 256, 1, 0, 0, 0, 259, 262, 1, 0, 0, 0, 260, 258, 1, 0, 0, 0, 260, 261, 1, 0, 0, 0, 261, 263, 1, 0, 0, 0, 262, 260, 1, 0, 0, 0, 263, 264, 5, 4, 0, 0, 264, 35, 1, 0, 0, 0, 265, 266, 5, 3, 0, 0, 266, 267, 5, 4, 0, 0, 267, 37, 1, 0, 0, 0, 268, 269, 5, 17, 0, 0, 269, 39, 1, 0, 0, 0, 270, 275, 3, 54, 27, 0, 271, 272, 5, 16, 0, 0, 272, 274, 3, 54, 27, 0, 273, 271, 1, 0, 0, 0, 274, 277, 1, 0, 0, 0, 275, 273, 1, 0, 0, 0, 275, 276, 1, 0, 0, 0, 276, 41, 1, 0, 0, 0, 277, 275, 1, 0, 0, 0, 278, 280, 5, 18, 0, 0, 279, 281, 3, 54, 27, 0, 280, 279, 1, 0, 0, 0, 280, 281, 1, 0, 0, 0, 281, 282, 1, 0, 0, 0, 282, 283, 5, 6, 0, 0, 283, 43, 1, 0, 0, 0, 284, 285, 3, 54, 27, 0, 285, 286, 5, 6, 0, 0, 286, 45, 1, 0, 0, 0, 287, 288, 5, 19, 0, 0, 288, 289, 5, 53, 0, 0, 289, 47, 1, 0, 0, 0, 290, 295, 3, 50, 25, 0, 291, 292, 5, 16, 0, 0, 292, 294, 3, 50, 25, 0, 293, 291, 1, 0, 0, 0, 294, 297, 1, 0, 0, 0, 295, 293, 1, 0, 0, 0, 295, 296, 1, 0, 0, 0, 296, 49, 1, 0, 0, 0, 297, 295, 1, 0, 0, 0, 298, 299, 3, 52, 26, 0, 299, 300, 3, 66, 33, 0, 300, 51, 1, 0, 0, 0, 301, 302, 7, 0, 
0, 0, 302, 53, 1, 0, 0, 0, 303, 306, 3, 60, 30, 0, 304, 306, 3, 30, 15, 0, 305, 303, 1, 0, 0, 0, 305, 304, 1, 0, 0, 0, 306, 55, 1, 0, 0, 0, 307, 308, 5, 24, 0, 0, 308, 57, 1, 0, 0, 0, 309, 310, 5, 25, 0, 0, 310, 311, 5, 6, 0, 0, 311, 59, 1, 0, 0, 0, 312, 313, 3, 62, 31, 0, 313, 314, 3, 70, 35, 0, 314, 316, 3, 60, 30, 0, 315, 317, 3, 38, 19, 0, 316, 315, 1, 0, 0, 0, 316, 317, 1, 0, 0, 0, 317, 319, 1, 0, 0, 0, 318, 320, 3, 36, 18, 0, 319, 318, 1, 0, 0, 0, 319, 320, 1, 0, 0, 0, 320, 323, 1, 0, 0, 0, 321, 323, 3, 72, 36, 0, 322, 312, 1, 0, 0, 0, 322, 321, 1, 0, 0, 0, 323, 61, 1, 0, 0, 0, 324, 325, 6, 31, -1, 0, 325, 326, 7, 1, 0, 0, 326, 331, 3, 62, 31, 5, 327, 331, 3, 68, 34, 0, 328, 331, 3, 66, 33, 0, 329, 331, 3, 34, 17, 0, 330, 324, 1, 0, 0, 0, 330, 327, 1, 0, 0, 0, 330, 328, 1, 0, 0, 0, 330, 329, 1, 0, 0, 0, 331, 336, 1, 0, 0, 0, 332, 333, 10, 4, 0, 0, 333, 335, 7, 1, 0, 0, 334, 332, 1, 0, 0, 0, 335, 338, 1, 0, 0, 0, 336, 334, 1, 0, 0, 0, 336, 337, 1, 0, 0, 0, 337, 63, 1, 0, 0, 0, 338, 336, 1, 0, 0, 0, 339, 340, 7, 2, 0, 0, 340, 65, 1, 0, 0, 0, 341, 353, 5, 47, 0, 0, 342, 353, 5, 48, 0, 0, 343, 353, 5, 50, 0, 0, 344, 353, 5, 51, 0, 0, 345, 353, 5, 53, 0, 0, 346, 353, 5, 49, 0, 0, 347, 353, 3, 30, 15, 0, 348, 349, 5, 1, 0, 0, 349, 350, 3, 54, 27, 0, 350, 351, 5, 2, 0, 0, 351, 353, 1, 0, 0, 0, 352, 341, 1, 0, 0, 0, 352, 342, 1, 0, 0, 0, 352, 343, 1, 0, 0, 0, 352, 344, 1, 0, 0, 0, 352, 345, 1, 0, 0, 0, 352, 346, 1, 0, 0, 0, 352, 347, 1, 0, 0, 0, 352, 348, 1, 0, 0, 0, 353, 67, 1, 0, 0, 0, 354, 355, 5, 32, 0, 0, 355, 359, 3, 66, 33, 0, 356, 357, 5, 52, 0, 0, 357, 359, 3, 66, 33, 0, 358, 354, 1, 0, 0, 0, 358, 356, 1, 0, 0, 0, 359, 69, 1, 0, 0, 0, 360, 361, 7, 3, 0, 0, 361, 71, 1, 0, 0, 0, 362, 367, 3, 74, 37, 0, 363, 364, 5, 37, 0, 0, 364, 366, 3, 74, 37, 0, 365, 363, 1, 0, 0, 0, 366, 369, 1, 0, 0, 0, 367, 365, 1, 0, 0, 0, 367, 368, 1, 0, 0, 0, 368, 73, 1, 0, 0, 0, 369, 367, 1, 0, 0, 0, 370, 375, 3, 76, 38, 0, 371, 372, 5, 38, 0, 0, 372, 374, 3, 76, 38, 0, 373, 371, 1, 
0, 0, 0, 374, 377, 1, 0, 0, 0, 375, 373, 1, 0, 0, 0, 375, 376, 1, 0, 0, 0, 376, 75, 1, 0, 0, 0, 377, 375, 1, 0, 0, 0, 378, 383, 3, 78, 39, 0, 379, 380, 7, 4, 0, 0, 380, 382, 3, 78, 39, 0, 381, 379, 1, 0, 0, 0, 382, 385, 1, 0, 0, 0, 383, 381, 1, 0, 0, 0, 383, 384, 1, 0, 0, 0, 384, 77, 1, 0, 0, 0, 385, 383, 1, 0, 0, 0, 386, 391, 3, 80, 40, 0, 387, 388, 7, 2, 0, 0, 388, 390, 3, 80, 40, 0, 389, 387, 1, 0, 0, 0, 390, 393, 1, 0, 0, 0, 391, 389, 1, 0, 0, 0, 391, 392, 1, 0, 0, 0, 392, 79, 1, 0, 0, 0, 393, 391, 1, 0, 0, 0, 394, 399, 3, 82, 41, 0, 395, 396, 7, 5, 0, 0, 396, 398, 3, 82, 41, 0, 397, 395, 1, 0, 0, 0, 398, 401, 1, 0, 0, 0, 399, 397, 1, 0, 0, 0, 399, 400, 1, 0, 0, 0, 400, 81, 1, 0, 0, 0, 401, 399, 1, 0, 0, 0, 402, 407, 3, 62, 31, 0, 403, 404, 7, 6, 0, 0, 404, 406, 3, 62, 31, 0, 405, 403, 1, 0, 0, 0, 406, 409, 1, 0, 0, 0, 407, 405, 1, 0, 0, 0, 407, 408, 1, 0, 0, 0, 408, 83, 1, 0, 0, 0, 409, 407, 1, 0, 0, 0, 410, 413, 3, 80, 40, 0, 411, 413, 3, 82, 41, 0, 412, 410, 1, 0, 0, 0, 412, 411, 1, 0, 0, 0, 413, 85, 1, 0, 0, 0, 40, 89, 97, 106, 124, 130, 136, 144, 146, 149, 156, 168, 172, 201, 209, 215, 225, 228, 234, 238, 243, 250, 260, 275, 280, 295, 305, 316, 319, 322, 330, 336, 352, 358, 367, 375, 383, 391, 399, 407, 412] \ No newline at end of file diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASS.tokens b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASS.tokens new file mode 100644 index 00000000000..ffe14a736f0 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASS.tokens @@ -0,0 +1,99 @@ +T__0=1 +T__1=2 +T__2=3 +T__3=4 +T__4=5 +T__5=6 +T__6=7 +T__7=8 +T__8=9 +T__9=10 +T__10=11 +T__11=12 +T__12=13 +T__13=14 +T__14=15 +T__15=16 +T__16=17 +T__17=18 +T__18=19 +T__19=20 +T__20=21 +T__21=22 +T__22=23 +T__23=24 +T__24=25 +T__25=26 +T__26=27 +T__27=28 +T__28=29 +T__29=30 +T__30=31 +T__31=32 +T__32=33 +T__33=34 +T__34=35 +T__35=36 +T__36=37 +T__37=38 
+T__38=39 +T__39=40 +T__40=41 +T__41=42 +T__42=43 +T__43=44 +SL_COMMENT=45 +ML_COMMENT=46 +ID=47 +INT=48 +BOOL=49 +FLOAT=50 +CHAR=51 +POINTER=52 +STRING=53 +WS=54 +'('=1 +')'=2 +'{'=3 +'}'=4 +'='=5 +';'=6 +'for'=7 +'while'=8 +'if'=9 +'else'=10 +'switch'=11 +'case'=12 +':'=13 +'['=14 +']'=15 +','=16 +'nullptr'=17 +'return'=18 +'include'=19 +'int'=20 +'float'=21 +'double'=22 +'void'=23 +'default'=24 +'break'=25 +'++'=26 +'--'=27 +'>'=28 +'<'=29 +'<='=30 +'>='=31 +'&'=32 +'+='=33 +'-='=34 +'*='=35 +'/='=36 +'||'=37 +'&&'=38 +'=='=39 +'!='=40 +'+'=41 +'-'=42 +'/'=43 +'%'=44 +'*'=52 diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSLexer.interp b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSLexer.interp new file mode 100644 index 00000000000..315deca7ee1 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSLexer.interp @@ -0,0 +1,180 @@ +token literal names: +null +'(' +')' +'{' +'}' +'=' +';' +'for' +'while' +'if' +'else' +'switch' +'case' +':' +'[' +']' +',' +'nullptr' +'return' +'include' +'int' +'float' +'double' +'void' +'default' +'break' +'++' +'--' +'>' +'<' +'<=' +'>=' +'&' +'+=' +'-=' +'*=' +'/=' +'||' +'&&' +'==' +'!=' +'+' +'-' +'/' +'%' +null +null +null +null +null +null +null +'*' +null +null + +token symbolic names: +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +null +SL_COMMENT +ML_COMMENT +ID +INT +BOOL +FLOAT +CHAR +POINTER +STRING +WS + +rule names: +T__0 +T__1 +T__2 +T__3 +T__4 +T__5 +T__6 +T__7 +T__8 +T__9 +T__10 +T__11 +T__12 +T__13 +T__14 +T__15 +T__16 +T__17 +T__18 +T__19 +T__20 +T__21 +T__22 +T__23 +T__24 +T__25 +T__26 +T__27 +T__28 +T__29 +T__30 +T__31 +T__32 +T__33 +T__34 +T__35 +T__36 +T__37 +T__38 +T__39 
+T__40 +T__41 +T__42 +T__43 +SL_COMMENT +ML_COMMENT +ID +INT +BOOL +FLOAT +CHAR +POINTER +STRING +ESC_SEQ +WS + +channel names: +DEFAULT_TOKEN_CHANNEL +HIDDEN + +mode names: +DEFAULT_MODE + +atn: +[4, 0, 54, 402, 6, -1, 2, 0, 7, 0, 2, 1, 7, 1, 2, 2, 7, 2, 2, 3, 7, 3, 2, 4, 7, 4, 2, 5, 7, 5, 2, 6, 7, 6, 2, 7, 7, 7, 2, 8, 7, 8, 2, 9, 7, 9, 2, 10, 7, 10, 2, 11, 7, 11, 2, 12, 7, 12, 2, 13, 7, 13, 2, 14, 7, 14, 2, 15, 7, 15, 2, 16, 7, 16, 2, 17, 7, 17, 2, 18, 7, 18, 2, 19, 7, 19, 2, 20, 7, 20, 2, 21, 7, 21, 2, 22, 7, 22, 2, 23, 7, 23, 2, 24, 7, 24, 2, 25, 7, 25, 2, 26, 7, 26, 2, 27, 7, 27, 2, 28, 7, 28, 2, 29, 7, 29, 2, 30, 7, 30, 2, 31, 7, 31, 2, 32, 7, 32, 2, 33, 7, 33, 2, 34, 7, 34, 2, 35, 7, 35, 2, 36, 7, 36, 2, 37, 7, 37, 2, 38, 7, 38, 2, 39, 7, 39, 2, 40, 7, 40, 2, 41, 7, 41, 2, 42, 7, 42, 2, 43, 7, 43, 2, 44, 7, 44, 2, 45, 7, 45, 2, 46, 7, 46, 2, 47, 7, 47, 2, 48, 7, 48, 2, 49, 7, 49, 2, 50, 7, 50, 2, 51, 7, 51, 2, 52, 7, 52, 2, 53, 7, 53, 2, 54, 7, 54, 1, 0, 1, 0, 1, 1, 1, 1, 1, 2, 1, 2, 1, 3, 1, 3, 1, 4, 1, 4, 1, 5, 1, 5, 1, 6, 1, 6, 1, 6, 1, 6, 1, 7, 1, 7, 1, 7, 1, 7, 1, 7, 1, 7, 1, 8, 1, 8, 1, 8, 1, 9, 1, 9, 1, 9, 1, 9, 1, 9, 1, 10, 1, 10, 1, 10, 1, 10, 1, 10, 1, 10, 1, 10, 1, 11, 1, 11, 1, 11, 1, 11, 1, 11, 1, 12, 1, 12, 1, 13, 1, 13, 1, 14, 1, 14, 1, 15, 1, 15, 1, 16, 1, 16, 1, 16, 1, 16, 1, 16, 1, 16, 1, 16, 1, 16, 1, 17, 1, 17, 1, 17, 1, 17, 1, 17, 1, 17, 1, 17, 1, 18, 1, 18, 1, 18, 1, 18, 1, 18, 1, 18, 1, 18, 1, 18, 1, 19, 1, 19, 1, 19, 1, 19, 1, 20, 1, 20, 1, 20, 1, 20, 1, 20, 1, 20, 1, 21, 1, 21, 1, 21, 1, 21, 1, 21, 1, 21, 1, 21, 1, 22, 1, 22, 1, 22, 1, 22, 1, 22, 1, 23, 1, 23, 1, 23, 1, 23, 1, 23, 1, 23, 1, 23, 1, 23, 1, 24, 1, 24, 1, 24, 1, 24, 1, 24, 1, 24, 1, 25, 1, 25, 1, 25, 1, 26, 1, 26, 1, 26, 1, 27, 1, 27, 1, 28, 1, 28, 1, 29, 1, 29, 1, 29, 1, 30, 1, 30, 1, 30, 1, 31, 1, 31, 1, 32, 1, 32, 1, 32, 1, 33, 1, 33, 1, 33, 1, 34, 1, 34, 1, 34, 1, 35, 1, 35, 1, 35, 1, 36, 1, 36, 1, 36, 1, 37, 1, 37, 1, 37, 1, 38, 1, 38, 1, 38, 1, 39, 1, 39, 1, 39, 1, 
40, 1, 40, 1, 41, 1, 41, 1, 42, 1, 42, 1, 43, 1, 43, 1, 44, 1, 44, 1, 44, 1, 44, 5, 44, 275, 8, 44, 10, 44, 12, 44, 278, 9, 44, 1, 44, 1, 44, 1, 45, 1, 45, 1, 45, 1, 45, 5, 45, 286, 8, 45, 10, 45, 12, 45, 289, 9, 45, 1, 45, 1, 45, 1, 45, 1, 45, 1, 45, 1, 46, 1, 46, 5, 46, 298, 8, 46, 10, 46, 12, 46, 301, 9, 46, 1, 47, 3, 47, 304, 8, 47, 1, 47, 4, 47, 307, 8, 47, 11, 47, 12, 47, 308, 1, 48, 1, 48, 1, 48, 1, 48, 1, 48, 1, 48, 1, 48, 1, 48, 1, 48, 3, 48, 320, 8, 48, 1, 49, 4, 49, 323, 8, 49, 11, 49, 12, 49, 324, 1, 49, 1, 49, 4, 49, 329, 8, 49, 11, 49, 12, 49, 330, 1, 49, 1, 49, 3, 49, 335, 8, 49, 1, 49, 4, 49, 338, 8, 49, 11, 49, 12, 49, 339, 3, 49, 342, 8, 49, 1, 49, 1, 49, 4, 49, 346, 8, 49, 11, 49, 12, 49, 347, 1, 49, 1, 49, 3, 49, 352, 8, 49, 1, 49, 4, 49, 355, 8, 49, 11, 49, 12, 49, 356, 3, 49, 359, 8, 49, 1, 49, 4, 49, 362, 8, 49, 11, 49, 12, 49, 363, 1, 49, 1, 49, 3, 49, 368, 8, 49, 1, 49, 4, 49, 371, 8, 49, 11, 49, 12, 49, 372, 3, 49, 375, 8, 49, 1, 50, 1, 50, 1, 50, 1, 50, 1, 51, 1, 51, 1, 52, 1, 52, 1, 52, 5, 52, 386, 8, 52, 10, 52, 12, 52, 389, 9, 52, 1, 52, 1, 52, 1, 53, 1, 53, 1, 53, 1, 54, 4, 54, 397, 8, 54, 11, 54, 12, 54, 398, 1, 54, 1, 54, 1, 287, 0, 55, 1, 1, 3, 2, 5, 3, 7, 4, 9, 5, 11, 6, 13, 7, 15, 8, 17, 9, 19, 10, 21, 11, 23, 12, 25, 13, 27, 14, 29, 15, 31, 16, 33, 17, 35, 18, 37, 19, 39, 20, 41, 21, 43, 22, 45, 23, 47, 24, 49, 25, 51, 26, 53, 27, 55, 28, 57, 29, 59, 30, 61, 31, 63, 32, 65, 33, 67, 34, 69, 35, 71, 36, 73, 37, 75, 38, 77, 39, 79, 40, 81, 41, 83, 42, 85, 43, 87, 44, 89, 45, 91, 46, 93, 47, 95, 48, 97, 49, 99, 50, 101, 51, 103, 52, 105, 53, 107, 0, 109, 54, 1, 0, 10, 2, 0, 10, 10, 13, 13, 3, 0, 65, 90, 95, 95, 97, 122, 4, 0, 48, 57, 65, 90, 95, 95, 97, 122, 1, 0, 48, 57, 2, 0, 69, 69, 101, 101, 2, 0, 43, 43, 45, 45, 2, 0, 65, 90, 97, 122, 2, 0, 34, 34, 92, 92, 8, 0, 34, 34, 39, 39, 92, 92, 98, 98, 102, 102, 110, 110, 114, 114, 116, 116, 3, 0, 9, 10, 13, 13, 32, 32, 423, 0, 1, 1, 0, 0, 0, 0, 3, 1, 0, 0, 0, 0, 5, 1, 0, 0, 0, 0, 7, 1, 
0, 0, 0, 0, 9, 1, 0, 0, 0, 0, 11, 1, 0, 0, 0, 0, 13, 1, 0, 0, 0, 0, 15, 1, 0, 0, 0, 0, 17, 1, 0, 0, 0, 0, 19, 1, 0, 0, 0, 0, 21, 1, 0, 0, 0, 0, 23, 1, 0, 0, 0, 0, 25, 1, 0, 0, 0, 0, 27, 1, 0, 0, 0, 0, 29, 1, 0, 0, 0, 0, 31, 1, 0, 0, 0, 0, 33, 1, 0, 0, 0, 0, 35, 1, 0, 0, 0, 0, 37, 1, 0, 0, 0, 0, 39, 1, 0, 0, 0, 0, 41, 1, 0, 0, 0, 0, 43, 1, 0, 0, 0, 0, 45, 1, 0, 0, 0, 0, 47, 1, 0, 0, 0, 0, 49, 1, 0, 0, 0, 0, 51, 1, 0, 0, 0, 0, 53, 1, 0, 0, 0, 0, 55, 1, 0, 0, 0, 0, 57, 1, 0, 0, 0, 0, 59, 1, 0, 0, 0, 0, 61, 1, 0, 0, 0, 0, 63, 1, 0, 0, 0, 0, 65, 1, 0, 0, 0, 0, 67, 1, 0, 0, 0, 0, 69, 1, 0, 0, 0, 0, 71, 1, 0, 0, 0, 0, 73, 1, 0, 0, 0, 0, 75, 1, 0, 0, 0, 0, 77, 1, 0, 0, 0, 0, 79, 1, 0, 0, 0, 0, 81, 1, 0, 0, 0, 0, 83, 1, 0, 0, 0, 0, 85, 1, 0, 0, 0, 0, 87, 1, 0, 0, 0, 0, 89, 1, 0, 0, 0, 0, 91, 1, 0, 0, 0, 0, 93, 1, 0, 0, 0, 0, 95, 1, 0, 0, 0, 0, 97, 1, 0, 0, 0, 0, 99, 1, 0, 0, 0, 0, 101, 1, 0, 0, 0, 0, 103, 1, 0, 0, 0, 0, 105, 1, 0, 0, 0, 0, 109, 1, 0, 0, 0, 1, 111, 1, 0, 0, 0, 3, 113, 1, 0, 0, 0, 5, 115, 1, 0, 0, 0, 7, 117, 1, 0, 0, 0, 9, 119, 1, 0, 0, 0, 11, 121, 1, 0, 0, 0, 13, 123, 1, 0, 0, 0, 15, 127, 1, 0, 0, 0, 17, 133, 1, 0, 0, 0, 19, 136, 1, 0, 0, 0, 21, 141, 1, 0, 0, 0, 23, 148, 1, 0, 0, 0, 25, 153, 1, 0, 0, 0, 27, 155, 1, 0, 0, 0, 29, 157, 1, 0, 0, 0, 31, 159, 1, 0, 0, 0, 33, 161, 1, 0, 0, 0, 35, 169, 1, 0, 0, 0, 37, 176, 1, 0, 0, 0, 39, 184, 1, 0, 0, 0, 41, 188, 1, 0, 0, 0, 43, 194, 1, 0, 0, 0, 45, 201, 1, 0, 0, 0, 47, 206, 1, 0, 0, 0, 49, 214, 1, 0, 0, 0, 51, 220, 1, 0, 0, 0, 53, 223, 1, 0, 0, 0, 55, 226, 1, 0, 0, 0, 57, 228, 1, 0, 0, 0, 59, 230, 1, 0, 0, 0, 61, 233, 1, 0, 0, 0, 63, 236, 1, 0, 0, 0, 65, 238, 1, 0, 0, 0, 67, 241, 1, 0, 0, 0, 69, 244, 1, 0, 0, 0, 71, 247, 1, 0, 0, 0, 73, 250, 1, 0, 0, 0, 75, 253, 1, 0, 0, 0, 77, 256, 1, 0, 0, 0, 79, 259, 1, 0, 0, 0, 81, 262, 1, 0, 0, 0, 83, 264, 1, 0, 0, 0, 85, 266, 1, 0, 0, 0, 87, 268, 1, 0, 0, 0, 89, 270, 1, 0, 0, 0, 91, 281, 1, 0, 0, 0, 93, 295, 1, 0, 0, 0, 95, 303, 1, 0, 0, 0, 97, 319, 1, 0, 0, 0, 99, 374, 1, 
0, 0, 0, 101, 376, 1, 0, 0, 0, 103, 380, 1, 0, 0, 0, 105, 382, 1, 0, 0, 0, 107, 392, 1, 0, 0, 0, 109, 396, 1, 0, 0, 0, 111, 112, 5, 40, 0, 0, 112, 2, 1, 0, 0, 0, 113, 114, 5, 41, 0, 0, 114, 4, 1, 0, 0, 0, 115, 116, 5, 123, 0, 0, 116, 6, 1, 0, 0, 0, 117, 118, 5, 125, 0, 0, 118, 8, 1, 0, 0, 0, 119, 120, 5, 61, 0, 0, 120, 10, 1, 0, 0, 0, 121, 122, 5, 59, 0, 0, 122, 12, 1, 0, 0, 0, 123, 124, 5, 102, 0, 0, 124, 125, 5, 111, 0, 0, 125, 126, 5, 114, 0, 0, 126, 14, 1, 0, 0, 0, 127, 128, 5, 119, 0, 0, 128, 129, 5, 104, 0, 0, 129, 130, 5, 105, 0, 0, 130, 131, 5, 108, 0, 0, 131, 132, 5, 101, 0, 0, 132, 16, 1, 0, 0, 0, 133, 134, 5, 105, 0, 0, 134, 135, 5, 102, 0, 0, 135, 18, 1, 0, 0, 0, 136, 137, 5, 101, 0, 0, 137, 138, 5, 108, 0, 0, 138, 139, 5, 115, 0, 0, 139, 140, 5, 101, 0, 0, 140, 20, 1, 0, 0, 0, 141, 142, 5, 115, 0, 0, 142, 143, 5, 119, 0, 0, 143, 144, 5, 105, 0, 0, 144, 145, 5, 116, 0, 0, 145, 146, 5, 99, 0, 0, 146, 147, 5, 104, 0, 0, 147, 22, 1, 0, 0, 0, 148, 149, 5, 99, 0, 0, 149, 150, 5, 97, 0, 0, 150, 151, 5, 115, 0, 0, 151, 152, 5, 101, 0, 0, 152, 24, 1, 0, 0, 0, 153, 154, 5, 58, 0, 0, 154, 26, 1, 0, 0, 0, 155, 156, 5, 91, 0, 0, 156, 28, 1, 0, 0, 0, 157, 158, 5, 93, 0, 0, 158, 30, 1, 0, 0, 0, 159, 160, 5, 44, 0, 0, 160, 32, 1, 0, 0, 0, 161, 162, 5, 110, 0, 0, 162, 163, 5, 117, 0, 0, 163, 164, 5, 108, 0, 0, 164, 165, 5, 108, 0, 0, 165, 166, 5, 112, 0, 0, 166, 167, 5, 116, 0, 0, 167, 168, 5, 114, 0, 0, 168, 34, 1, 0, 0, 0, 169, 170, 5, 114, 0, 0, 170, 171, 5, 101, 0, 0, 171, 172, 5, 116, 0, 0, 172, 173, 5, 117, 0, 0, 173, 174, 5, 114, 0, 0, 174, 175, 5, 110, 0, 0, 175, 36, 1, 0, 0, 0, 176, 177, 5, 105, 0, 0, 177, 178, 5, 110, 0, 0, 178, 179, 5, 99, 0, 0, 179, 180, 5, 108, 0, 0, 180, 181, 5, 117, 0, 0, 181, 182, 5, 100, 0, 0, 182, 183, 5, 101, 0, 0, 183, 38, 1, 0, 0, 0, 184, 185, 5, 105, 0, 0, 185, 186, 5, 110, 0, 0, 186, 187, 5, 116, 0, 0, 187, 40, 1, 0, 0, 0, 188, 189, 5, 102, 0, 0, 189, 190, 5, 108, 0, 0, 190, 191, 5, 111, 0, 0, 191, 192, 5, 97, 0, 0, 192, 193, 5, 
116, 0, 0, 193, 42, 1, 0, 0, 0, 194, 195, 5, 100, 0, 0, 195, 196, 5, 111, 0, 0, 196, 197, 5, 117, 0, 0, 197, 198, 5, 98, 0, 0, 198, 199, 5, 108, 0, 0, 199, 200, 5, 101, 0, 0, 200, 44, 1, 0, 0, 0, 201, 202, 5, 118, 0, 0, 202, 203, 5, 111, 0, 0, 203, 204, 5, 105, 0, 0, 204, 205, 5, 100, 0, 0, 205, 46, 1, 0, 0, 0, 206, 207, 5, 100, 0, 0, 207, 208, 5, 101, 0, 0, 208, 209, 5, 102, 0, 0, 209, 210, 5, 97, 0, 0, 210, 211, 5, 117, 0, 0, 211, 212, 5, 108, 0, 0, 212, 213, 5, 116, 0, 0, 213, 48, 1, 0, 0, 0, 214, 215, 5, 98, 0, 0, 215, 216, 5, 114, 0, 0, 216, 217, 5, 101, 0, 0, 217, 218, 5, 97, 0, 0, 218, 219, 5, 107, 0, 0, 219, 50, 1, 0, 0, 0, 220, 221, 5, 43, 0, 0, 221, 222, 5, 43, 0, 0, 222, 52, 1, 0, 0, 0, 223, 224, 5, 45, 0, 0, 224, 225, 5, 45, 0, 0, 225, 54, 1, 0, 0, 0, 226, 227, 5, 62, 0, 0, 227, 56, 1, 0, 0, 0, 228, 229, 5, 60, 0, 0, 229, 58, 1, 0, 0, 0, 230, 231, 5, 60, 0, 0, 231, 232, 5, 61, 0, 0, 232, 60, 1, 0, 0, 0, 233, 234, 5, 62, 0, 0, 234, 235, 5, 61, 0, 0, 235, 62, 1, 0, 0, 0, 236, 237, 5, 38, 0, 0, 237, 64, 1, 0, 0, 0, 238, 239, 5, 43, 0, 0, 239, 240, 5, 61, 0, 0, 240, 66, 1, 0, 0, 0, 241, 242, 5, 45, 0, 0, 242, 243, 5, 61, 0, 0, 243, 68, 1, 0, 0, 0, 244, 245, 5, 42, 0, 0, 245, 246, 5, 61, 0, 0, 246, 70, 1, 0, 0, 0, 247, 248, 5, 47, 0, 0, 248, 249, 5, 61, 0, 0, 249, 72, 1, 0, 0, 0, 250, 251, 5, 124, 0, 0, 251, 252, 5, 124, 0, 0, 252, 74, 1, 0, 0, 0, 253, 254, 5, 38, 0, 0, 254, 255, 5, 38, 0, 0, 255, 76, 1, 0, 0, 0, 256, 257, 5, 61, 0, 0, 257, 258, 5, 61, 0, 0, 258, 78, 1, 0, 0, 0, 259, 260, 5, 33, 0, 0, 260, 261, 5, 61, 0, 0, 261, 80, 1, 0, 0, 0, 262, 263, 5, 43, 0, 0, 263, 82, 1, 0, 0, 0, 264, 265, 5, 45, 0, 0, 265, 84, 1, 0, 0, 0, 266, 267, 5, 47, 0, 0, 267, 86, 1, 0, 0, 0, 268, 269, 5, 37, 0, 0, 269, 88, 1, 0, 0, 0, 270, 271, 5, 47, 0, 0, 271, 272, 5, 47, 0, 0, 272, 276, 1, 0, 0, 0, 273, 275, 8, 0, 0, 0, 274, 273, 1, 0, 0, 0, 275, 278, 1, 0, 0, 0, 276, 274, 1, 0, 0, 0, 276, 277, 1, 0, 0, 0, 277, 279, 1, 0, 0, 0, 278, 276, 1, 0, 0, 0, 279, 280, 6, 44, 0, 0, 
280, 90, 1, 0, 0, 0, 281, 282, 5, 47, 0, 0, 282, 283, 5, 42, 0, 0, 283, 287, 1, 0, 0, 0, 284, 286, 9, 0, 0, 0, 285, 284, 1, 0, 0, 0, 286, 289, 1, 0, 0, 0, 287, 288, 1, 0, 0, 0, 287, 285, 1, 0, 0, 0, 288, 290, 1, 0, 0, 0, 289, 287, 1, 0, 0, 0, 290, 291, 5, 42, 0, 0, 291, 292, 5, 47, 0, 0, 292, 293, 1, 0, 0, 0, 293, 294, 6, 45, 0, 0, 294, 92, 1, 0, 0, 0, 295, 299, 7, 1, 0, 0, 296, 298, 7, 2, 0, 0, 297, 296, 1, 0, 0, 0, 298, 301, 1, 0, 0, 0, 299, 297, 1, 0, 0, 0, 299, 300, 1, 0, 0, 0, 300, 94, 1, 0, 0, 0, 301, 299, 1, 0, 0, 0, 302, 304, 5, 45, 0, 0, 303, 302, 1, 0, 0, 0, 303, 304, 1, 0, 0, 0, 304, 306, 1, 0, 0, 0, 305, 307, 7, 3, 0, 0, 306, 305, 1, 0, 0, 0, 307, 308, 1, 0, 0, 0, 308, 306, 1, 0, 0, 0, 308, 309, 1, 0, 0, 0, 309, 96, 1, 0, 0, 0, 310, 311, 5, 116, 0, 0, 311, 312, 5, 114, 0, 0, 312, 313, 5, 117, 0, 0, 313, 320, 5, 101, 0, 0, 314, 315, 5, 102, 0, 0, 315, 316, 5, 97, 0, 0, 316, 317, 5, 108, 0, 0, 317, 318, 5, 115, 0, 0, 318, 320, 5, 101, 0, 0, 319, 310, 1, 0, 0, 0, 319, 314, 1, 0, 0, 0, 320, 98, 1, 0, 0, 0, 321, 323, 7, 3, 0, 0, 322, 321, 1, 0, 0, 0, 323, 324, 1, 0, 0, 0, 324, 322, 1, 0, 0, 0, 324, 325, 1, 0, 0, 0, 325, 326, 1, 0, 0, 0, 326, 328, 5, 46, 0, 0, 327, 329, 7, 3, 0, 0, 328, 327, 1, 0, 0, 0, 329, 330, 1, 0, 0, 0, 330, 328, 1, 0, 0, 0, 330, 331, 1, 0, 0, 0, 331, 341, 1, 0, 0, 0, 332, 334, 7, 4, 0, 0, 333, 335, 7, 5, 0, 0, 334, 333, 1, 0, 0, 0, 334, 335, 1, 0, 0, 0, 335, 337, 1, 0, 0, 0, 336, 338, 7, 3, 0, 0, 337, 336, 1, 0, 0, 0, 338, 339, 1, 0, 0, 0, 339, 337, 1, 0, 0, 0, 339, 340, 1, 0, 0, 0, 340, 342, 1, 0, 0, 0, 341, 332, 1, 0, 0, 0, 341, 342, 1, 0, 0, 0, 342, 375, 1, 0, 0, 0, 343, 345, 5, 46, 0, 0, 344, 346, 7, 3, 0, 0, 345, 344, 1, 0, 0, 0, 346, 347, 1, 0, 0, 0, 347, 345, 1, 0, 0, 0, 347, 348, 1, 0, 0, 0, 348, 358, 1, 0, 0, 0, 349, 351, 7, 4, 0, 0, 350, 352, 7, 5, 0, 0, 351, 350, 1, 0, 0, 0, 351, 352, 1, 0, 0, 0, 352, 354, 1, 0, 0, 0, 353, 355, 7, 3, 0, 0, 354, 353, 1, 0, 0, 0, 355, 356, 1, 0, 0, 0, 356, 354, 1, 0, 0, 0, 356, 357, 1, 0, 0, 0, 
357, 359, 1, 0, 0, 0, 358, 349, 1, 0, 0, 0, 358, 359, 1, 0, 0, 0, 359, 375, 1, 0, 0, 0, 360, 362, 7, 3, 0, 0, 361, 360, 1, 0, 0, 0, 362, 363, 1, 0, 0, 0, 363, 361, 1, 0, 0, 0, 363, 364, 1, 0, 0, 0, 364, 365, 1, 0, 0, 0, 365, 367, 7, 4, 0, 0, 366, 368, 7, 5, 0, 0, 367, 366, 1, 0, 0, 0, 367, 368, 1, 0, 0, 0, 368, 370, 1, 0, 0, 0, 369, 371, 7, 3, 0, 0, 370, 369, 1, 0, 0, 0, 371, 372, 1, 0, 0, 0, 372, 370, 1, 0, 0, 0, 372, 373, 1, 0, 0, 0, 373, 375, 1, 0, 0, 0, 374, 322, 1, 0, 0, 0, 374, 343, 1, 0, 0, 0, 374, 361, 1, 0, 0, 0, 375, 100, 1, 0, 0, 0, 376, 377, 5, 34, 0, 0, 377, 378, 7, 6, 0, 0, 378, 379, 5, 34, 0, 0, 379, 102, 1, 0, 0, 0, 380, 381, 5, 42, 0, 0, 381, 104, 1, 0, 0, 0, 382, 387, 5, 34, 0, 0, 383, 386, 3, 107, 53, 0, 384, 386, 8, 7, 0, 0, 385, 383, 1, 0, 0, 0, 385, 384, 1, 0, 0, 0, 386, 389, 1, 0, 0, 0, 387, 385, 1, 0, 0, 0, 387, 388, 1, 0, 0, 0, 388, 390, 1, 0, 0, 0, 389, 387, 1, 0, 0, 0, 390, 391, 5, 34, 0, 0, 391, 106, 1, 0, 0, 0, 392, 393, 5, 92, 0, 0, 393, 394, 7, 8, 0, 0, 394, 108, 1, 0, 0, 0, 395, 397, 7, 9, 0, 0, 396, 395, 1, 0, 0, 0, 397, 398, 1, 0, 0, 0, 398, 396, 1, 0, 0, 0, 398, 399, 1, 0, 0, 0, 399, 400, 1, 0, 0, 0, 400, 401, 6, 54, 0, 0, 401, 110, 1, 0, 0, 0, 23, 0, 276, 287, 299, 303, 308, 319, 324, 330, 334, 339, 341, 347, 351, 356, 358, 363, 367, 372, 374, 385, 387, 398, 1, 6, 0, 0] \ No newline at end of file diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSLexer.py b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSLexer.py new file mode 100644 index 00000000000..bd93f866972 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSLexer.py @@ -0,0 +1,259 @@ +# Generated from CASS.g4 by ANTLR 4.13.2 +from antlr4 import * +from io import StringIO +import sys +if sys.version_info[1] > 5: + from typing import TextIO +else: + from typing.io import TextIO + + +def serializedATN(): + return [ + 
4,0,54,402,6,-1,2,0,7,0,2,1,7,1,2,2,7,2,2,3,7,3,2,4,7,4,2,5,7,5, + 2,6,7,6,2,7,7,7,2,8,7,8,2,9,7,9,2,10,7,10,2,11,7,11,2,12,7,12,2, + 13,7,13,2,14,7,14,2,15,7,15,2,16,7,16,2,17,7,17,2,18,7,18,2,19,7, + 19,2,20,7,20,2,21,7,21,2,22,7,22,2,23,7,23,2,24,7,24,2,25,7,25,2, + 26,7,26,2,27,7,27,2,28,7,28,2,29,7,29,2,30,7,30,2,31,7,31,2,32,7, + 32,2,33,7,33,2,34,7,34,2,35,7,35,2,36,7,36,2,37,7,37,2,38,7,38,2, + 39,7,39,2,40,7,40,2,41,7,41,2,42,7,42,2,43,7,43,2,44,7,44,2,45,7, + 45,2,46,7,46,2,47,7,47,2,48,7,48,2,49,7,49,2,50,7,50,2,51,7,51,2, + 52,7,52,2,53,7,53,2,54,7,54,1,0,1,0,1,1,1,1,1,2,1,2,1,3,1,3,1,4, + 1,4,1,5,1,5,1,6,1,6,1,6,1,6,1,7,1,7,1,7,1,7,1,7,1,7,1,8,1,8,1,8, + 1,9,1,9,1,9,1,9,1,9,1,10,1,10,1,10,1,10,1,10,1,10,1,10,1,11,1,11, + 1,11,1,11,1,11,1,12,1,12,1,13,1,13,1,14,1,14,1,15,1,15,1,16,1,16, + 1,16,1,16,1,16,1,16,1,16,1,16,1,17,1,17,1,17,1,17,1,17,1,17,1,17, + 1,18,1,18,1,18,1,18,1,18,1,18,1,18,1,18,1,19,1,19,1,19,1,19,1,20, + 1,20,1,20,1,20,1,20,1,20,1,21,1,21,1,21,1,21,1,21,1,21,1,21,1,22, + 1,22,1,22,1,22,1,22,1,23,1,23,1,23,1,23,1,23,1,23,1,23,1,23,1,24, + 1,24,1,24,1,24,1,24,1,24,1,25,1,25,1,25,1,26,1,26,1,26,1,27,1,27, + 1,28,1,28,1,29,1,29,1,29,1,30,1,30,1,30,1,31,1,31,1,32,1,32,1,32, + 1,33,1,33,1,33,1,34,1,34,1,34,1,35,1,35,1,35,1,36,1,36,1,36,1,37, + 1,37,1,37,1,38,1,38,1,38,1,39,1,39,1,39,1,40,1,40,1,41,1,41,1,42, + 1,42,1,43,1,43,1,44,1,44,1,44,1,44,5,44,275,8,44,10,44,12,44,278, + 9,44,1,44,1,44,1,45,1,45,1,45,1,45,5,45,286,8,45,10,45,12,45,289, + 9,45,1,45,1,45,1,45,1,45,1,45,1,46,1,46,5,46,298,8,46,10,46,12,46, + 301,9,46,1,47,3,47,304,8,47,1,47,4,47,307,8,47,11,47,12,47,308,1, + 48,1,48,1,48,1,48,1,48,1,48,1,48,1,48,1,48,3,48,320,8,48,1,49,4, + 49,323,8,49,11,49,12,49,324,1,49,1,49,4,49,329,8,49,11,49,12,49, + 330,1,49,1,49,3,49,335,8,49,1,49,4,49,338,8,49,11,49,12,49,339,3, + 49,342,8,49,1,49,1,49,4,49,346,8,49,11,49,12,49,347,1,49,1,49,3, + 49,352,8,49,1,49,4,49,355,8,49,11,49,12,49,356,3,49,359,8,49,1,49, + 
4,49,362,8,49,11,49,12,49,363,1,49,1,49,3,49,368,8,49,1,49,4,49, + 371,8,49,11,49,12,49,372,3,49,375,8,49,1,50,1,50,1,50,1,50,1,51, + 1,51,1,52,1,52,1,52,5,52,386,8,52,10,52,12,52,389,9,52,1,52,1,52, + 1,53,1,53,1,53,1,54,4,54,397,8,54,11,54,12,54,398,1,54,1,54,1,287, + 0,55,1,1,3,2,5,3,7,4,9,5,11,6,13,7,15,8,17,9,19,10,21,11,23,12,25, + 13,27,14,29,15,31,16,33,17,35,18,37,19,39,20,41,21,43,22,45,23,47, + 24,49,25,51,26,53,27,55,28,57,29,59,30,61,31,63,32,65,33,67,34,69, + 35,71,36,73,37,75,38,77,39,79,40,81,41,83,42,85,43,87,44,89,45,91, + 46,93,47,95,48,97,49,99,50,101,51,103,52,105,53,107,0,109,54,1,0, + 10,2,0,10,10,13,13,3,0,65,90,95,95,97,122,4,0,48,57,65,90,95,95, + 97,122,1,0,48,57,2,0,69,69,101,101,2,0,43,43,45,45,2,0,65,90,97, + 122,2,0,34,34,92,92,8,0,34,34,39,39,92,92,98,98,102,102,110,110, + 114,114,116,116,3,0,9,10,13,13,32,32,423,0,1,1,0,0,0,0,3,1,0,0,0, + 0,5,1,0,0,0,0,7,1,0,0,0,0,9,1,0,0,0,0,11,1,0,0,0,0,13,1,0,0,0,0, + 15,1,0,0,0,0,17,1,0,0,0,0,19,1,0,0,0,0,21,1,0,0,0,0,23,1,0,0,0,0, + 25,1,0,0,0,0,27,1,0,0,0,0,29,1,0,0,0,0,31,1,0,0,0,0,33,1,0,0,0,0, + 35,1,0,0,0,0,37,1,0,0,0,0,39,1,0,0,0,0,41,1,0,0,0,0,43,1,0,0,0,0, + 45,1,0,0,0,0,47,1,0,0,0,0,49,1,0,0,0,0,51,1,0,0,0,0,53,1,0,0,0,0, + 55,1,0,0,0,0,57,1,0,0,0,0,59,1,0,0,0,0,61,1,0,0,0,0,63,1,0,0,0,0, + 65,1,0,0,0,0,67,1,0,0,0,0,69,1,0,0,0,0,71,1,0,0,0,0,73,1,0,0,0,0, + 75,1,0,0,0,0,77,1,0,0,0,0,79,1,0,0,0,0,81,1,0,0,0,0,83,1,0,0,0,0, + 85,1,0,0,0,0,87,1,0,0,0,0,89,1,0,0,0,0,91,1,0,0,0,0,93,1,0,0,0,0, + 95,1,0,0,0,0,97,1,0,0,0,0,99,1,0,0,0,0,101,1,0,0,0,0,103,1,0,0,0, + 0,105,1,0,0,0,0,109,1,0,0,0,1,111,1,0,0,0,3,113,1,0,0,0,5,115,1, + 0,0,0,7,117,1,0,0,0,9,119,1,0,0,0,11,121,1,0,0,0,13,123,1,0,0,0, + 15,127,1,0,0,0,17,133,1,0,0,0,19,136,1,0,0,0,21,141,1,0,0,0,23,148, + 1,0,0,0,25,153,1,0,0,0,27,155,1,0,0,0,29,157,1,0,0,0,31,159,1,0, + 0,0,33,161,1,0,0,0,35,169,1,0,0,0,37,176,1,0,0,0,39,184,1,0,0,0, + 41,188,1,0,0,0,43,194,1,0,0,0,45,201,1,0,0,0,47,206,1,0,0,0,49,214, + 
1,0,0,0,51,220,1,0,0,0,53,223,1,0,0,0,55,226,1,0,0,0,57,228,1,0, + 0,0,59,230,1,0,0,0,61,233,1,0,0,0,63,236,1,0,0,0,65,238,1,0,0,0, + 67,241,1,0,0,0,69,244,1,0,0,0,71,247,1,0,0,0,73,250,1,0,0,0,75,253, + 1,0,0,0,77,256,1,0,0,0,79,259,1,0,0,0,81,262,1,0,0,0,83,264,1,0, + 0,0,85,266,1,0,0,0,87,268,1,0,0,0,89,270,1,0,0,0,91,281,1,0,0,0, + 93,295,1,0,0,0,95,303,1,0,0,0,97,319,1,0,0,0,99,374,1,0,0,0,101, + 376,1,0,0,0,103,380,1,0,0,0,105,382,1,0,0,0,107,392,1,0,0,0,109, + 396,1,0,0,0,111,112,5,40,0,0,112,2,1,0,0,0,113,114,5,41,0,0,114, + 4,1,0,0,0,115,116,5,123,0,0,116,6,1,0,0,0,117,118,5,125,0,0,118, + 8,1,0,0,0,119,120,5,61,0,0,120,10,1,0,0,0,121,122,5,59,0,0,122,12, + 1,0,0,0,123,124,5,102,0,0,124,125,5,111,0,0,125,126,5,114,0,0,126, + 14,1,0,0,0,127,128,5,119,0,0,128,129,5,104,0,0,129,130,5,105,0,0, + 130,131,5,108,0,0,131,132,5,101,0,0,132,16,1,0,0,0,133,134,5,105, + 0,0,134,135,5,102,0,0,135,18,1,0,0,0,136,137,5,101,0,0,137,138,5, + 108,0,0,138,139,5,115,0,0,139,140,5,101,0,0,140,20,1,0,0,0,141,142, + 5,115,0,0,142,143,5,119,0,0,143,144,5,105,0,0,144,145,5,116,0,0, + 145,146,5,99,0,0,146,147,5,104,0,0,147,22,1,0,0,0,148,149,5,99,0, + 0,149,150,5,97,0,0,150,151,5,115,0,0,151,152,5,101,0,0,152,24,1, + 0,0,0,153,154,5,58,0,0,154,26,1,0,0,0,155,156,5,91,0,0,156,28,1, + 0,0,0,157,158,5,93,0,0,158,30,1,0,0,0,159,160,5,44,0,0,160,32,1, + 0,0,0,161,162,5,110,0,0,162,163,5,117,0,0,163,164,5,108,0,0,164, + 165,5,108,0,0,165,166,5,112,0,0,166,167,5,116,0,0,167,168,5,114, + 0,0,168,34,1,0,0,0,169,170,5,114,0,0,170,171,5,101,0,0,171,172,5, + 116,0,0,172,173,5,117,0,0,173,174,5,114,0,0,174,175,5,110,0,0,175, + 36,1,0,0,0,176,177,5,105,0,0,177,178,5,110,0,0,178,179,5,99,0,0, + 179,180,5,108,0,0,180,181,5,117,0,0,181,182,5,100,0,0,182,183,5, + 101,0,0,183,38,1,0,0,0,184,185,5,105,0,0,185,186,5,110,0,0,186,187, + 5,116,0,0,187,40,1,0,0,0,188,189,5,102,0,0,189,190,5,108,0,0,190, + 191,5,111,0,0,191,192,5,97,0,0,192,193,5,116,0,0,193,42,1,0,0,0, + 
194,195,5,100,0,0,195,196,5,111,0,0,196,197,5,117,0,0,197,198,5, + 98,0,0,198,199,5,108,0,0,199,200,5,101,0,0,200,44,1,0,0,0,201,202, + 5,118,0,0,202,203,5,111,0,0,203,204,5,105,0,0,204,205,5,100,0,0, + 205,46,1,0,0,0,206,207,5,100,0,0,207,208,5,101,0,0,208,209,5,102, + 0,0,209,210,5,97,0,0,210,211,5,117,0,0,211,212,5,108,0,0,212,213, + 5,116,0,0,213,48,1,0,0,0,214,215,5,98,0,0,215,216,5,114,0,0,216, + 217,5,101,0,0,217,218,5,97,0,0,218,219,5,107,0,0,219,50,1,0,0,0, + 220,221,5,43,0,0,221,222,5,43,0,0,222,52,1,0,0,0,223,224,5,45,0, + 0,224,225,5,45,0,0,225,54,1,0,0,0,226,227,5,62,0,0,227,56,1,0,0, + 0,228,229,5,60,0,0,229,58,1,0,0,0,230,231,5,60,0,0,231,232,5,61, + 0,0,232,60,1,0,0,0,233,234,5,62,0,0,234,235,5,61,0,0,235,62,1,0, + 0,0,236,237,5,38,0,0,237,64,1,0,0,0,238,239,5,43,0,0,239,240,5,61, + 0,0,240,66,1,0,0,0,241,242,5,45,0,0,242,243,5,61,0,0,243,68,1,0, + 0,0,244,245,5,42,0,0,245,246,5,61,0,0,246,70,1,0,0,0,247,248,5,47, + 0,0,248,249,5,61,0,0,249,72,1,0,0,0,250,251,5,124,0,0,251,252,5, + 124,0,0,252,74,1,0,0,0,253,254,5,38,0,0,254,255,5,38,0,0,255,76, + 1,0,0,0,256,257,5,61,0,0,257,258,5,61,0,0,258,78,1,0,0,0,259,260, + 5,33,0,0,260,261,5,61,0,0,261,80,1,0,0,0,262,263,5,43,0,0,263,82, + 1,0,0,0,264,265,5,45,0,0,265,84,1,0,0,0,266,267,5,47,0,0,267,86, + 1,0,0,0,268,269,5,37,0,0,269,88,1,0,0,0,270,271,5,47,0,0,271,272, + 5,47,0,0,272,276,1,0,0,0,273,275,8,0,0,0,274,273,1,0,0,0,275,278, + 1,0,0,0,276,274,1,0,0,0,276,277,1,0,0,0,277,279,1,0,0,0,278,276, + 1,0,0,0,279,280,6,44,0,0,280,90,1,0,0,0,281,282,5,47,0,0,282,283, + 5,42,0,0,283,287,1,0,0,0,284,286,9,0,0,0,285,284,1,0,0,0,286,289, + 1,0,0,0,287,288,1,0,0,0,287,285,1,0,0,0,288,290,1,0,0,0,289,287, + 1,0,0,0,290,291,5,42,0,0,291,292,5,47,0,0,292,293,1,0,0,0,293,294, + 6,45,0,0,294,92,1,0,0,0,295,299,7,1,0,0,296,298,7,2,0,0,297,296, + 1,0,0,0,298,301,1,0,0,0,299,297,1,0,0,0,299,300,1,0,0,0,300,94,1, + 0,0,0,301,299,1,0,0,0,302,304,5,45,0,0,303,302,1,0,0,0,303,304,1, + 
0,0,0,304,306,1,0,0,0,305,307,7,3,0,0,306,305,1,0,0,0,307,308,1, + 0,0,0,308,306,1,0,0,0,308,309,1,0,0,0,309,96,1,0,0,0,310,311,5,116, + 0,0,311,312,5,114,0,0,312,313,5,117,0,0,313,320,5,101,0,0,314,315, + 5,102,0,0,315,316,5,97,0,0,316,317,5,108,0,0,317,318,5,115,0,0,318, + 320,5,101,0,0,319,310,1,0,0,0,319,314,1,0,0,0,320,98,1,0,0,0,321, + 323,7,3,0,0,322,321,1,0,0,0,323,324,1,0,0,0,324,322,1,0,0,0,324, + 325,1,0,0,0,325,326,1,0,0,0,326,328,5,46,0,0,327,329,7,3,0,0,328, + 327,1,0,0,0,329,330,1,0,0,0,330,328,1,0,0,0,330,331,1,0,0,0,331, + 341,1,0,0,0,332,334,7,4,0,0,333,335,7,5,0,0,334,333,1,0,0,0,334, + 335,1,0,0,0,335,337,1,0,0,0,336,338,7,3,0,0,337,336,1,0,0,0,338, + 339,1,0,0,0,339,337,1,0,0,0,339,340,1,0,0,0,340,342,1,0,0,0,341, + 332,1,0,0,0,341,342,1,0,0,0,342,375,1,0,0,0,343,345,5,46,0,0,344, + 346,7,3,0,0,345,344,1,0,0,0,346,347,1,0,0,0,347,345,1,0,0,0,347, + 348,1,0,0,0,348,358,1,0,0,0,349,351,7,4,0,0,350,352,7,5,0,0,351, + 350,1,0,0,0,351,352,1,0,0,0,352,354,1,0,0,0,353,355,7,3,0,0,354, + 353,1,0,0,0,355,356,1,0,0,0,356,354,1,0,0,0,356,357,1,0,0,0,357, + 359,1,0,0,0,358,349,1,0,0,0,358,359,1,0,0,0,359,375,1,0,0,0,360, + 362,7,3,0,0,361,360,1,0,0,0,362,363,1,0,0,0,363,361,1,0,0,0,363, + 364,1,0,0,0,364,365,1,0,0,0,365,367,7,4,0,0,366,368,7,5,0,0,367, + 366,1,0,0,0,367,368,1,0,0,0,368,370,1,0,0,0,369,371,7,3,0,0,370, + 369,1,0,0,0,371,372,1,0,0,0,372,370,1,0,0,0,372,373,1,0,0,0,373, + 375,1,0,0,0,374,322,1,0,0,0,374,343,1,0,0,0,374,361,1,0,0,0,375, + 100,1,0,0,0,376,377,5,34,0,0,377,378,7,6,0,0,378,379,5,34,0,0,379, + 102,1,0,0,0,380,381,5,42,0,0,381,104,1,0,0,0,382,387,5,34,0,0,383, + 386,3,107,53,0,384,386,8,7,0,0,385,383,1,0,0,0,385,384,1,0,0,0,386, + 389,1,0,0,0,387,385,1,0,0,0,387,388,1,0,0,0,388,390,1,0,0,0,389, + 387,1,0,0,0,390,391,5,34,0,0,391,106,1,0,0,0,392,393,5,92,0,0,393, + 394,7,8,0,0,394,108,1,0,0,0,395,397,7,9,0,0,396,395,1,0,0,0,397, + 398,1,0,0,0,398,396,1,0,0,0,398,399,1,0,0,0,399,400,1,0,0,0,400, + 
401,6,54,0,0,401,110,1,0,0,0,23,0,276,287,299,303,308,319,324,330, + 334,339,341,347,351,356,358,363,367,372,374,385,387,398,1,6,0,0 + ] + +class CASSLexer(Lexer): + + atn = ATNDeserializer().deserialize(serializedATN()) + + decisionsToDFA = [ DFA(ds, i) for i, ds in enumerate(atn.decisionToState) ] + + T__0 = 1 + T__1 = 2 + T__2 = 3 + T__3 = 4 + T__4 = 5 + T__5 = 6 + T__6 = 7 + T__7 = 8 + T__8 = 9 + T__9 = 10 + T__10 = 11 + T__11 = 12 + T__12 = 13 + T__13 = 14 + T__14 = 15 + T__15 = 16 + T__16 = 17 + T__17 = 18 + T__18 = 19 + T__19 = 20 + T__20 = 21 + T__21 = 22 + T__22 = 23 + T__23 = 24 + T__24 = 25 + T__25 = 26 + T__26 = 27 + T__27 = 28 + T__28 = 29 + T__29 = 30 + T__30 = 31 + T__31 = 32 + T__32 = 33 + T__33 = 34 + T__34 = 35 + T__35 = 36 + T__36 = 37 + T__37 = 38 + T__38 = 39 + T__39 = 40 + T__40 = 41 + T__41 = 42 + T__42 = 43 + T__43 = 44 + SL_COMMENT = 45 + ML_COMMENT = 46 + ID = 47 + INT = 48 + BOOL = 49 + FLOAT = 50 + CHAR = 51 + POINTER = 52 + STRING = 53 + WS = 54 + + channelNames = [ u"DEFAULT_TOKEN_CHANNEL", u"HIDDEN" ] + + modeNames = [ "DEFAULT_MODE" ] + + literalNames = [ "", + "'('", "')'", "'{'", "'}'", "'='", "';'", "'for'", "'while'", + "'if'", "'else'", "'switch'", "'case'", "':'", "'['", "']'", + "','", "'nullptr'", "'return'", "'include'", "'int'", "'float'", + "'double'", "'void'", "'default'", "'break'", "'++'", "'--'", + "'>'", "'<'", "'<='", "'>='", "'&'", "'+='", "'-='", "'*='", + "'/='", "'||'", "'&&'", "'=='", "'!='", "'+'", "'-'", "'/'", + "'%'", "'*'" ] + + symbolicNames = [ "", + "SL_COMMENT", "ML_COMMENT", "ID", "INT", "BOOL", "FLOAT", "CHAR", + "POINTER", "STRING", "WS" ] + + ruleNames = [ "T__0", "T__1", "T__2", "T__3", "T__4", "T__5", "T__6", + "T__7", "T__8", "T__9", "T__10", "T__11", "T__12", "T__13", + "T__14", "T__15", "T__16", "T__17", "T__18", "T__19", + "T__20", "T__21", "T__22", "T__23", "T__24", "T__25", + "T__26", "T__27", "T__28", "T__29", "T__30", "T__31", + "T__32", "T__33", "T__34", "T__35", "T__36", "T__37", + 
"T__38", "T__39", "T__40", "T__41", "T__42", "T__43", + "SL_COMMENT", "ML_COMMENT", "ID", "INT", "BOOL", "FLOAT", + "CHAR", "POINTER", "STRING", "ESC_SEQ", "WS" ] + + grammarFileName = "CASS.g4" + + def __init__(self, input=None, output:TextIO = sys.stdout): + super().__init__(input, output) + self.checkVersion("4.13.2") + self._interp = LexerATNSimulator(self, self.atn, self.decisionsToDFA, PredictionContextCache()) + self._actions = None + self._predicates = None + + diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSLexer.tokens b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSLexer.tokens new file mode 100644 index 00000000000..ffe14a736f0 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSLexer.tokens @@ -0,0 +1,99 @@ +T__0=1 +T__1=2 +T__2=3 +T__3=4 +T__4=5 +T__5=6 +T__6=7 +T__7=8 +T__8=9 +T__9=10 +T__10=11 +T__11=12 +T__12=13 +T__13=14 +T__14=15 +T__15=16 +T__16=17 +T__17=18 +T__18=19 +T__19=20 +T__20=21 +T__21=22 +T__22=23 +T__23=24 +T__24=25 +T__25=26 +T__26=27 +T__27=28 +T__28=29 +T__29=30 +T__30=31 +T__31=32 +T__32=33 +T__33=34 +T__34=35 +T__35=36 +T__36=37 +T__37=38 +T__38=39 +T__39=40 +T__40=41 +T__41=42 +T__42=43 +T__43=44 +SL_COMMENT=45 +ML_COMMENT=46 +ID=47 +INT=48 +BOOL=49 +FLOAT=50 +CHAR=51 +POINTER=52 +STRING=53 +WS=54 +'('=1 +')'=2 +'{'=3 +'}'=4 +'='=5 +';'=6 +'for'=7 +'while'=8 +'if'=9 +'else'=10 +'switch'=11 +'case'=12 +':'=13 +'['=14 +']'=15 +','=16 +'nullptr'=17 +'return'=18 +'include'=19 +'int'=20 +'float'=21 +'double'=22 +'void'=23 +'default'=24 +'break'=25 +'++'=26 +'--'=27 +'>'=28 +'<'=29 +'<='=30 +'>='=31 +'&'=32 +'+='=33 +'-='=34 +'*='=35 +'/='=36 +'||'=37 +'&&'=38 +'=='=39 +'!='=40 +'+'=41 +'-'=42 +'/'=43 +'%'=44 +'*'=52 diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSListener.py b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSListener.py 
new file mode 100644 index 00000000000..2ecfa54026d --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSListener.py @@ -0,0 +1,399 @@ +# Generated from CASS.g4 by ANTLR 4.13.2 +from antlr4 import * +if "." in __name__: + from .CASSParser import CASSParser +else: + from CASSParser import CASSParser + +# This class defines a complete listener for a parse tree produced by CASSParser. +class CASSListener(ParseTreeListener): + + # Enter a parse tree produced by CASSParser#prog. + def enterProg(self, ctx:CASSParser.ProgContext): + pass + + # Exit a parse tree produced by CASSParser#prog. + def exitProg(self, ctx:CASSParser.ProgContext): + pass + + + # Enter a parse tree produced by CASSParser#functionDefinition. + def enterFunctionDefinition(self, ctx:CASSParser.FunctionDefinitionContext): + pass + + # Exit a parse tree produced by CASSParser#functionDefinition. + def exitFunctionDefinition(self, ctx:CASSParser.FunctionDefinitionContext): + pass + + + # Enter a parse tree produced by CASSParser#compoundStatement. + def enterCompoundStatement(self, ctx:CASSParser.CompoundStatementContext): + pass + + # Exit a parse tree produced by CASSParser#compoundStatement. + def exitCompoundStatement(self, ctx:CASSParser.CompoundStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#statement. + def enterStatement(self, ctx:CASSParser.StatementContext): + pass + + # Exit a parse tree produced by CASSParser#statement. + def exitStatement(self, ctx:CASSParser.StatementContext): + pass + + + # Enter a parse tree produced by CASSParser#declarationStatement. + def enterDeclarationStatement(self, ctx:CASSParser.DeclarationStatementContext): + pass + + # Exit a parse tree produced by CASSParser#declarationStatement. + def exitDeclarationStatement(self, ctx:CASSParser.DeclarationStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#forBlockStatement. 
+ def enterForBlockStatement(self, ctx:CASSParser.ForBlockStatementContext): + pass + + # Exit a parse tree produced by CASSParser#forBlockStatement. + def exitForBlockStatement(self, ctx:CASSParser.ForBlockStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#forSingleStatement. + def enterForSingleStatement(self, ctx:CASSParser.ForSingleStatementContext): + pass + + # Exit a parse tree produced by CASSParser#forSingleStatement. + def exitForSingleStatement(self, ctx:CASSParser.ForSingleStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#conditionClause. + def enterConditionClause(self, ctx:CASSParser.ConditionClauseContext): + pass + + # Exit a parse tree produced by CASSParser#conditionClause. + def exitConditionClause(self, ctx:CASSParser.ConditionClauseContext): + pass + + + # Enter a parse tree produced by CASSParser#whileBlockStatement. + def enterWhileBlockStatement(self, ctx:CASSParser.WhileBlockStatementContext): + pass + + # Exit a parse tree produced by CASSParser#whileBlockStatement. + def exitWhileBlockStatement(self, ctx:CASSParser.WhileBlockStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#whileSingleStatement. + def enterWhileSingleStatement(self, ctx:CASSParser.WhileSingleStatementContext): + pass + + # Exit a parse tree produced by CASSParser#whileSingleStatement. + def exitWhileSingleStatement(self, ctx:CASSParser.WhileSingleStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#ifBlockStatement. + def enterIfBlockStatement(self, ctx:CASSParser.IfBlockStatementContext): + pass + + # Exit a parse tree produced by CASSParser#ifBlockStatement. + def exitIfBlockStatement(self, ctx:CASSParser.IfBlockStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#ifSingleStatement. + def enterIfSingleStatement(self, ctx:CASSParser.IfSingleStatementContext): + pass + + # Exit a parse tree produced by CASSParser#ifSingleStatement. 
+ def exitIfSingleStatement(self, ctx:CASSParser.IfSingleStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#elseClause. + def enterElseClause(self, ctx:CASSParser.ElseClauseContext): + pass + + # Exit a parse tree produced by CASSParser#elseClause. + def exitElseClause(self, ctx:CASSParser.ElseClauseContext): + pass + + + # Enter a parse tree produced by CASSParser#switchStatement. + def enterSwitchStatement(self, ctx:CASSParser.SwitchStatementContext): + pass + + # Exit a parse tree produced by CASSParser#switchStatement. + def exitSwitchStatement(self, ctx:CASSParser.SwitchStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#caseStatement. + def enterCaseStatement(self, ctx:CASSParser.CaseStatementContext): + pass + + # Exit a parse tree produced by CASSParser#caseStatement. + def exitCaseStatement(self, ctx:CASSParser.CaseStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#functionCall. + def enterFunctionCall(self, ctx:CASSParser.FunctionCallContext): + pass + + # Exit a parse tree produced by CASSParser#functionCall. + def exitFunctionCall(self, ctx:CASSParser.FunctionCallContext): + pass + + + # Enter a parse tree produced by CASSParser#arrayDeclarator. + def enterArrayDeclarator(self, ctx:CASSParser.ArrayDeclaratorContext): + pass + + # Exit a parse tree produced by CASSParser#arrayDeclarator. + def exitArrayDeclarator(self, ctx:CASSParser.ArrayDeclaratorContext): + pass + + + # Enter a parse tree produced by CASSParser#listInitializer. + def enterListInitializer(self, ctx:CASSParser.ListInitializerContext): + pass + + # Exit a parse tree produced by CASSParser#listInitializer. + def exitListInitializer(self, ctx:CASSParser.ListInitializerContext): + pass + + + # Enter a parse tree produced by CASSParser#emptyInitializer. + def enterEmptyInitializer(self, ctx:CASSParser.EmptyInitializerContext): + pass + + # Exit a parse tree produced by CASSParser#emptyInitializer. 
+ def exitEmptyInitializer(self, ctx:CASSParser.EmptyInitializerContext): + pass + + + # Enter a parse tree produced by CASSParser#nullptr. + def enterNullptr(self, ctx:CASSParser.NullptrContext): + pass + + # Exit a parse tree produced by CASSParser#nullptr. + def exitNullptr(self, ctx:CASSParser.NullptrContext): + pass + + + # Enter a parse tree produced by CASSParser#argumentList. + def enterArgumentList(self, ctx:CASSParser.ArgumentListContext): + pass + + # Exit a parse tree produced by CASSParser#argumentList. + def exitArgumentList(self, ctx:CASSParser.ArgumentListContext): + pass + + + # Enter a parse tree produced by CASSParser#returnStatement. + def enterReturnStatement(self, ctx:CASSParser.ReturnStatementContext): + pass + + # Exit a parse tree produced by CASSParser#returnStatement. + def exitReturnStatement(self, ctx:CASSParser.ReturnStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#expressionStatement. + def enterExpressionStatement(self, ctx:CASSParser.ExpressionStatementContext): + pass + + # Exit a parse tree produced by CASSParser#expressionStatement. + def exitExpressionStatement(self, ctx:CASSParser.ExpressionStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#includeStatement. + def enterIncludeStatement(self, ctx:CASSParser.IncludeStatementContext): + pass + + # Exit a parse tree produced by CASSParser#includeStatement. + def exitIncludeStatement(self, ctx:CASSParser.IncludeStatementContext): + pass + + + # Enter a parse tree produced by CASSParser#parameterList. + def enterParameterList(self, ctx:CASSParser.ParameterListContext): + pass + + # Exit a parse tree produced by CASSParser#parameterList. + def exitParameterList(self, ctx:CASSParser.ParameterListContext): + pass + + + # Enter a parse tree produced by CASSParser#parameter. + def enterParameter(self, ctx:CASSParser.ParameterContext): + pass + + # Exit a parse tree produced by CASSParser#parameter. 
+ def exitParameter(self, ctx:CASSParser.ParameterContext): + pass + + + # Enter a parse tree produced by CASSParser#typeSpec. + def enterTypeSpec(self, ctx:CASSParser.TypeSpecContext): + pass + + # Exit a parse tree produced by CASSParser#typeSpec. + def exitTypeSpec(self, ctx:CASSParser.TypeSpecContext): + pass + + + # Enter a parse tree produced by CASSParser#expression. + def enterExpression(self, ctx:CASSParser.ExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#expression. + def exitExpression(self, ctx:CASSParser.ExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#defaultExpression. + def enterDefaultExpression(self, ctx:CASSParser.DefaultExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#defaultExpression. + def exitDefaultExpression(self, ctx:CASSParser.DefaultExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#breakExpression. + def enterBreakExpression(self, ctx:CASSParser.BreakExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#breakExpression. + def exitBreakExpression(self, ctx:CASSParser.BreakExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#assignmentExpression. + def enterAssignmentExpression(self, ctx:CASSParser.AssignmentExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#assignmentExpression. + def exitAssignmentExpression(self, ctx:CASSParser.AssignmentExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#unaryExpression. + def enterUnaryExpression(self, ctx:CASSParser.UnaryExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#unaryExpression. + def exitUnaryExpression(self, ctx:CASSParser.UnaryExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#comparingExpression. 
+ def enterComparingExpression(self, ctx:CASSParser.ComparingExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#comparingExpression. + def exitComparingExpression(self, ctx:CASSParser.ComparingExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#primaryExpression. + def enterPrimaryExpression(self, ctx:CASSParser.PrimaryExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#primaryExpression. + def exitPrimaryExpression(self, ctx:CASSParser.PrimaryExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#pointerExpression. + def enterPointerExpression(self, ctx:CASSParser.PointerExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#pointerExpression. + def exitPointerExpression(self, ctx:CASSParser.PointerExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#assignmentOperator. + def enterAssignmentOperator(self, ctx:CASSParser.AssignmentOperatorContext): + pass + + # Exit a parse tree produced by CASSParser#assignmentOperator. + def exitAssignmentOperator(self, ctx:CASSParser.AssignmentOperatorContext): + pass + + + # Enter a parse tree produced by CASSParser#logicalOrExpression. + def enterLogicalOrExpression(self, ctx:CASSParser.LogicalOrExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#logicalOrExpression. + def exitLogicalOrExpression(self, ctx:CASSParser.LogicalOrExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#logicalAndExpression. + def enterLogicalAndExpression(self, ctx:CASSParser.LogicalAndExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#logicalAndExpression. + def exitLogicalAndExpression(self, ctx:CASSParser.LogicalAndExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#equalityExpression. 
+ def enterEqualityExpression(self, ctx:CASSParser.EqualityExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#equalityExpression. + def exitEqualityExpression(self, ctx:CASSParser.EqualityExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#relationalExpression. + def enterRelationalExpression(self, ctx:CASSParser.RelationalExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#relationalExpression. + def exitRelationalExpression(self, ctx:CASSParser.RelationalExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#additiveExpression. + def enterAdditiveExpression(self, ctx:CASSParser.AdditiveExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#additiveExpression. + def exitAdditiveExpression(self, ctx:CASSParser.AdditiveExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#multiplicativeExpression. + def enterMultiplicativeExpression(self, ctx:CASSParser.MultiplicativeExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#multiplicativeExpression. + def exitMultiplicativeExpression(self, ctx:CASSParser.MultiplicativeExpressionContext): + pass + + + # Enter a parse tree produced by CASSParser#operationExpression. + def enterOperationExpression(self, ctx:CASSParser.OperationExpressionContext): + pass + + # Exit a parse tree produced by CASSParser#operationExpression. 
class CassNode:
    """A node of a CASS tree.

    Nodes labelled ``"removed"`` are structural placeholders: every method
    below skips them and treats their children as if they were attached
    directly to the placeholder's parent.
    """

    def __init__(self, label):
        # Labels are always stored as strings so the prefix checks used
        # throughout this module ("v", "V", "N", ...) are safe.
        self.label = str(label)
        self.children = []
        # Index of the previous / next use of the same variable, or -1 when
        # there is none. Filled in by assign_usage_links().
        self.prevUse = -1
        self.nextUse = -1
        # Optional 4-tuple read by get_source_range_string()
        # (presumably start line, start column, end line, end column).
        self.source_range = None

    def add_child(self, child):
        """Append ``child`` as the last child of this node."""
        self.children.append(child)

    def to_cass_string(self) -> list:
        """Serialize every top-level child of this node to a CASS string.

        Returns:
            A list with one tab-separated string per entry of
            ``self.children`` (one per top-level function tree).

        Serialization rules, per node:
            * label starting with ``"v"``: label, prevUse, nextUse, children
            * label starting with ``"V"``, ``"N"``, ``"C"``, ``"S"`` or
              ``"F"``: label, children
            * anything else: label, child count, children
        The child count is the number of children that are actually
        serialized, i.e. ``"removed"`` placeholders are replaced by their own
        (recursively flattened) children before counting.
        """

        def effective_children(node):
            # Flatten "removed" placeholders so the emitted child count
            # always agrees with the children that follow it.
            flattened = []
            for child in node.children:
                if child.label == "removed":
                    flattened.extend(effective_children(child))
                else:
                    flattened.append(child)
            return flattened

        def traverse(node):
            kids = effective_children(node)
            serialized_kids = "".join(traverse(kid) for kid in kids)

            if node.label == "removed":
                # A placeholder contributes nothing of its own.
                return serialized_kids

            if node.label.startswith("v"):
                return f"{node.label}\t{node.prevUse}\t{node.nextUse}\t" + serialized_kids

            if node.label.startswith(("V", "N", "C", "S", "F")):
                return f"{node.label}\t" + serialized_kids

            return f"{node.label}\t{len(kids)}\t" + serialized_kids

        return [traverse(function_tree) for function_tree in self.children]

    def get_source_range_string(self):
        """Return ``source_range`` formatted as ``"a,b,c,d"``.

        The real range is returned only when the label starts with ``"S#FS"``
        and ``source_range`` has been set; otherwise ``"0,0,0,0"``.
        """
        if self.label.startswith("S#FS") and self.source_range is not None:
            (start_l, start_c, end_l, end_c) = self.source_range
            return f"{start_l},{start_c},{end_l},{end_c}"
        # Not S#FS, or no source_range information available.
        return "0,0,0,0"

    def get_node_count(self) -> int:
        """Count the nodes of this subtree, excluding ``"removed"`` placeholders."""
        total_nodes = 0
        # Explicit stack instead of recursion so very deep trees cannot hit
        # Python's recursion limit; visiting order does not matter for a count.
        pending = [self]
        while pending:
            node = pending.pop()
            if node.label != "removed":
                total_nodes += 1
            pending.extend(node.children)
        return total_nodes

    def to_dot(self):
        """Render the children of this node as GraphViz DOT source.

        This node itself is not emitted (it is expected to be the
        ``"removed"`` root). Nodes are numbered from 1 in the order they are
        visited (parent before children, children in insertion order).

        Returns:
            A list of DOT source lines: header, node declarations, edges,
            closing brace.
        """
        lines = ["digraph CASS {", " node [shape=ellipse];"]
        edges = []
        next_id = 1

        def traverse(node, parent_id=None):
            nonlocal next_id

            # Placeholders get no ID; their children hang off the parent.
            if node.label == "removed":
                for child in node.children:
                    traverse(child, parent_id)
                return

            current_id = next_id
            next_id += 1

            # Escape backslashes first, then double quotes, so the label is a
            # well-formed DOT quoted string even if it contains or ends with
            # a backslash.
            safe_label = node.label.replace("\\", "\\\\").replace('"', '\\"')
            lines.append(f' n{current_id} [label="[{current_id}]: {safe_label}"];')

            if parent_id is not None:
                edges.append(f' n{parent_id} -> n{current_id};')

            for child in node.children:
                traverse(child, current_id)

        for child in self.children:
            traverse(child)

        # Edges go after all node declarations.
        lines.extend(edges)
        lines.append("}")

        return lines


def assign_usage_links(root: CassNode):
    """Fill in ``prevUse`` / ``nextUse`` for every variable-usage node.

    1) Nodes are numbered in preorder depth-first order starting at 0;
       ``"removed"`` placeholders do not consume a number.
    2) Every node whose label starts with ``"v"`` is recorded under the
       variable name that follows the prefix (``"vsum"`` -> ``"sum"``).
    3) For each variable, consecutive usages are linked: ``prevUse`` /
       ``nextUse`` receive the index of the neighbouring usage, or -1 at
       either end of the chain.

    NOTE(review): numbering here starts at 0 and includes ``root`` when it is
    not a placeholder, whereas CassNode.to_dot() numbers from 1 and never
    emits the root - confirm which convention consumers expect.
    """
    usage_map = {}
    next_index = 0

    # Iterative preorder walk; children are pushed reversed so they are
    # popped in insertion order.
    pending = [root]
    while pending:
        node = pending.pop()
        if node.label != "removed":
            if node.label.startswith("v"):
                usage_map.setdefault(node.label[1:], []).append((next_index, node))
            next_index += 1
        pending.extend(reversed(node.children))

    # usage_list is e.g. [(4, nodeObj), (8, nodeObj), (21, nodeObj)]
    for usage_list in usage_map.values():
        last = len(usage_list) - 1
        for i, (_, node_obj) in enumerate(usage_list):
            node_obj.prevUse = usage_list[i - 1][0] if i > 0 else -1
            node_obj.nextUse = usage_list[i + 1][0] if i < last else -1
1,9,1,9,1,9,1,9,1,10,1,10,1,10,1,10,1,10,1,10,3,10,202,8,10,1,11, + 1,11,1,11,1,11,1,11,1,11,3,11,210,8,11,1,12,1,12,1,12,1,12,3,12, + 216,8,12,1,13,1,13,1,13,1,13,1,13,1,13,1,14,1,14,3,14,226,8,14,1, + 14,3,14,229,8,14,1,14,1,14,5,14,233,8,14,10,14,12,14,236,9,14,1, + 14,3,14,239,8,14,1,15,1,15,1,15,3,15,244,8,15,1,15,1,15,1,16,1,16, + 1,16,3,16,251,8,16,1,16,1,16,1,17,1,17,1,17,1,17,5,17,259,8,17,10, + 17,12,17,262,9,17,1,17,1,17,1,18,1,18,1,18,1,19,1,19,1,20,1,20,1, + 20,5,20,274,8,20,10,20,12,20,277,9,20,1,21,1,21,3,21,281,8,21,1, + 21,1,21,1,22,1,22,1,22,1,23,1,23,1,23,1,24,1,24,1,24,5,24,294,8, + 24,10,24,12,24,297,9,24,1,25,1,25,1,25,1,26,1,26,1,27,1,27,3,27, + 306,8,27,1,28,1,28,1,29,1,29,1,29,1,30,1,30,1,30,1,30,3,30,317,8, + 30,1,30,3,30,320,8,30,1,30,3,30,323,8,30,1,31,1,31,1,31,1,31,1,31, + 1,31,3,31,331,8,31,1,31,1,31,5,31,335,8,31,10,31,12,31,338,9,31, + 1,32,1,32,1,33,1,33,1,33,1,33,1,33,1,33,1,33,1,33,1,33,1,33,1,33, + 3,33,353,8,33,1,34,1,34,1,34,1,34,3,34,359,8,34,1,35,1,35,1,36,1, + 36,1,36,5,36,366,8,36,10,36,12,36,369,9,36,1,37,1,37,1,37,5,37,374, + 8,37,10,37,12,37,377,9,37,1,38,1,38,1,38,5,38,382,8,38,10,38,12, + 38,385,9,38,1,39,1,39,1,39,5,39,390,8,39,10,39,12,39,393,9,39,1, + 40,1,40,1,40,5,40,398,8,40,10,40,12,40,401,9,40,1,41,1,41,1,41,5, + 41,406,8,41,10,41,12,41,409,9,41,1,42,1,42,3,42,413,8,42,1,42,0, + 1,62,43,0,2,4,6,8,10,12,14,16,18,20,22,24,26,28,30,32,34,36,38,40, + 42,44,46,48,50,52,54,56,58,60,62,64,66,68,70,72,74,76,78,80,82,84, + 0,7,1,0,20,23,1,0,26,27,1,0,28,31,2,0,5,5,33,36,1,0,39,40,1,0,41, + 42,2,0,43,44,52,52,437,0,87,1,0,0,0,2,93,1,0,0,0,4,102,1,0,0,0,6, + 124,1,0,0,0,8,126,1,0,0,0,10,151,1,0,0,0,12,165,1,0,0,0,14,181,1, + 0,0,0,16,183,1,0,0,0,18,189,1,0,0,0,20,195,1,0,0,0,22,203,1,0,0, + 0,24,211,1,0,0,0,26,217,1,0,0,0,28,225,1,0,0,0,30,240,1,0,0,0,32, + 247,1,0,0,0,34,254,1,0,0,0,36,265,1,0,0,0,38,268,1,0,0,0,40,270, + 1,0,0,0,42,278,1,0,0,0,44,284,1,0,0,0,46,287,1,0,0,0,48,290,1,0, + 
0,0,50,298,1,0,0,0,52,301,1,0,0,0,54,305,1,0,0,0,56,307,1,0,0,0, + 58,309,1,0,0,0,60,322,1,0,0,0,62,330,1,0,0,0,64,339,1,0,0,0,66,352, + 1,0,0,0,68,358,1,0,0,0,70,360,1,0,0,0,72,362,1,0,0,0,74,370,1,0, + 0,0,76,378,1,0,0,0,78,386,1,0,0,0,80,394,1,0,0,0,82,402,1,0,0,0, + 84,412,1,0,0,0,86,88,3,6,3,0,87,86,1,0,0,0,88,89,1,0,0,0,89,87,1, + 0,0,0,89,90,1,0,0,0,90,91,1,0,0,0,91,92,5,0,0,1,92,1,1,0,0,0,93, + 94,3,52,26,0,94,95,3,66,33,0,95,97,5,1,0,0,96,98,3,48,24,0,97,96, + 1,0,0,0,97,98,1,0,0,0,98,99,1,0,0,0,99,100,5,2,0,0,100,101,3,4,2, + 0,101,3,1,0,0,0,102,106,5,3,0,0,103,105,3,6,3,0,104,103,1,0,0,0, + 105,108,1,0,0,0,106,104,1,0,0,0,106,107,1,0,0,0,107,109,1,0,0,0, + 108,106,1,0,0,0,109,110,5,4,0,0,110,5,1,0,0,0,111,125,3,8,4,0,112, + 125,3,10,5,0,113,125,3,12,6,0,114,125,3,16,8,0,115,125,3,18,9,0, + 116,125,3,20,10,0,117,125,3,22,11,0,118,125,3,42,21,0,119,125,3, + 26,13,0,120,125,3,28,14,0,121,125,3,44,22,0,122,125,3,2,1,0,123, + 125,3,46,23,0,124,111,1,0,0,0,124,112,1,0,0,0,124,113,1,0,0,0,124, + 114,1,0,0,0,124,115,1,0,0,0,124,116,1,0,0,0,124,117,1,0,0,0,124, + 118,1,0,0,0,124,119,1,0,0,0,124,120,1,0,0,0,124,121,1,0,0,0,124, + 122,1,0,0,0,124,123,1,0,0,0,125,7,1,0,0,0,126,130,3,52,26,0,127, + 129,5,52,0,0,128,127,1,0,0,0,129,132,1,0,0,0,130,128,1,0,0,0,130, + 131,1,0,0,0,131,136,1,0,0,0,132,130,1,0,0,0,133,137,3,66,33,0,134, + 137,1,0,0,0,135,137,3,32,16,0,136,133,1,0,0,0,136,134,1,0,0,0,136, + 135,1,0,0,0,137,146,1,0,0,0,138,144,5,5,0,0,139,145,3,54,27,0,140, + 145,1,0,0,0,141,145,3,38,19,0,142,145,1,0,0,0,143,145,3,36,18,0, + 144,139,1,0,0,0,144,140,1,0,0,0,144,141,1,0,0,0,144,142,1,0,0,0, + 144,143,1,0,0,0,145,147,1,0,0,0,146,138,1,0,0,0,146,147,1,0,0,0, + 147,149,1,0,0,0,148,150,5,6,0,0,149,148,1,0,0,0,149,150,1,0,0,0, + 150,9,1,0,0,0,151,152,5,7,0,0,152,156,5,1,0,0,153,157,3,8,4,0,154, + 157,1,0,0,0,155,157,3,60,30,0,156,153,1,0,0,0,156,154,1,0,0,0,156, + 155,1,0,0,0,157,158,1,0,0,0,158,159,5,6,0,0,159,160,3,72,36,0,160, + 
161,5,6,0,0,161,162,3,62,31,0,162,163,5,2,0,0,163,164,3,4,2,0,164, + 11,1,0,0,0,165,166,5,7,0,0,166,172,5,1,0,0,167,169,3,8,4,0,168,167, + 1,0,0,0,168,169,1,0,0,0,169,173,1,0,0,0,170,173,1,0,0,0,171,173, + 3,60,30,0,172,168,1,0,0,0,172,170,1,0,0,0,172,171,1,0,0,0,173,174, + 1,0,0,0,174,175,5,6,0,0,175,176,3,72,36,0,176,177,5,6,0,0,177,178, + 3,62,31,0,178,179,5,2,0,0,179,180,3,6,3,0,180,13,1,0,0,0,181,182, + 3,72,36,0,182,15,1,0,0,0,183,184,5,8,0,0,184,185,5,1,0,0,185,186, + 3,14,7,0,186,187,5,2,0,0,187,188,3,4,2,0,188,17,1,0,0,0,189,190, + 5,8,0,0,190,191,5,1,0,0,191,192,3,14,7,0,192,193,5,2,0,0,193,194, + 3,6,3,0,194,19,1,0,0,0,195,196,5,9,0,0,196,197,5,1,0,0,197,198,3, + 14,7,0,198,199,5,2,0,0,199,201,3,4,2,0,200,202,3,24,12,0,201,200, + 1,0,0,0,201,202,1,0,0,0,202,21,1,0,0,0,203,204,5,9,0,0,204,205,5, + 1,0,0,205,206,3,14,7,0,206,207,5,2,0,0,207,209,3,6,3,0,208,210,3, + 24,12,0,209,208,1,0,0,0,209,210,1,0,0,0,210,23,1,0,0,0,211,215,5, + 10,0,0,212,216,3,4,2,0,213,216,3,20,10,0,214,216,3,6,3,0,215,212, + 1,0,0,0,215,213,1,0,0,0,215,214,1,0,0,0,216,25,1,0,0,0,217,218,5, + 11,0,0,218,219,5,1,0,0,219,220,3,14,7,0,220,221,5,2,0,0,221,222, + 3,4,2,0,222,27,1,0,0,0,223,226,5,12,0,0,224,226,3,56,28,0,225,223, + 1,0,0,0,225,224,1,0,0,0,226,228,1,0,0,0,227,229,3,66,33,0,228,227, + 1,0,0,0,228,229,1,0,0,0,229,230,1,0,0,0,230,234,5,13,0,0,231,233, + 3,6,3,0,232,231,1,0,0,0,233,236,1,0,0,0,234,232,1,0,0,0,234,235, + 1,0,0,0,235,238,1,0,0,0,236,234,1,0,0,0,237,239,3,58,29,0,238,237, + 1,0,0,0,238,239,1,0,0,0,239,29,1,0,0,0,240,241,5,47,0,0,241,243, + 5,1,0,0,242,244,3,40,20,0,243,242,1,0,0,0,243,244,1,0,0,0,244,245, + 1,0,0,0,245,246,5,2,0,0,246,31,1,0,0,0,247,248,3,66,33,0,248,250, + 5,14,0,0,249,251,3,66,33,0,250,249,1,0,0,0,250,251,1,0,0,0,251,252, + 1,0,0,0,252,253,5,15,0,0,253,33,1,0,0,0,254,255,5,3,0,0,255,260, + 3,66,33,0,256,257,5,16,0,0,257,259,3,66,33,0,258,256,1,0,0,0,259, + 262,1,0,0,0,260,258,1,0,0,0,260,261,1,0,0,0,261,263,1,0,0,0,262, + 
260,1,0,0,0,263,264,5,4,0,0,264,35,1,0,0,0,265,266,5,3,0,0,266,267, + 5,4,0,0,267,37,1,0,0,0,268,269,5,17,0,0,269,39,1,0,0,0,270,275,3, + 54,27,0,271,272,5,16,0,0,272,274,3,54,27,0,273,271,1,0,0,0,274,277, + 1,0,0,0,275,273,1,0,0,0,275,276,1,0,0,0,276,41,1,0,0,0,277,275,1, + 0,0,0,278,280,5,18,0,0,279,281,3,54,27,0,280,279,1,0,0,0,280,281, + 1,0,0,0,281,282,1,0,0,0,282,283,5,6,0,0,283,43,1,0,0,0,284,285,3, + 54,27,0,285,286,5,6,0,0,286,45,1,0,0,0,287,288,5,19,0,0,288,289, + 5,53,0,0,289,47,1,0,0,0,290,295,3,50,25,0,291,292,5,16,0,0,292,294, + 3,50,25,0,293,291,1,0,0,0,294,297,1,0,0,0,295,293,1,0,0,0,295,296, + 1,0,0,0,296,49,1,0,0,0,297,295,1,0,0,0,298,299,3,52,26,0,299,300, + 3,66,33,0,300,51,1,0,0,0,301,302,7,0,0,0,302,53,1,0,0,0,303,306, + 3,60,30,0,304,306,3,30,15,0,305,303,1,0,0,0,305,304,1,0,0,0,306, + 55,1,0,0,0,307,308,5,24,0,0,308,57,1,0,0,0,309,310,5,25,0,0,310, + 311,5,6,0,0,311,59,1,0,0,0,312,313,3,62,31,0,313,314,3,70,35,0,314, + 316,3,60,30,0,315,317,3,38,19,0,316,315,1,0,0,0,316,317,1,0,0,0, + 317,319,1,0,0,0,318,320,3,36,18,0,319,318,1,0,0,0,319,320,1,0,0, + 0,320,323,1,0,0,0,321,323,3,72,36,0,322,312,1,0,0,0,322,321,1,0, + 0,0,323,61,1,0,0,0,324,325,6,31,-1,0,325,326,7,1,0,0,326,331,3,62, + 31,5,327,331,3,68,34,0,328,331,3,66,33,0,329,331,3,34,17,0,330,324, + 1,0,0,0,330,327,1,0,0,0,330,328,1,0,0,0,330,329,1,0,0,0,331,336, + 1,0,0,0,332,333,10,4,0,0,333,335,7,1,0,0,334,332,1,0,0,0,335,338, + 1,0,0,0,336,334,1,0,0,0,336,337,1,0,0,0,337,63,1,0,0,0,338,336,1, + 0,0,0,339,340,7,2,0,0,340,65,1,0,0,0,341,353,5,47,0,0,342,353,5, + 48,0,0,343,353,5,50,0,0,344,353,5,51,0,0,345,353,5,53,0,0,346,353, + 5,49,0,0,347,353,3,30,15,0,348,349,5,1,0,0,349,350,3,54,27,0,350, + 351,5,2,0,0,351,353,1,0,0,0,352,341,1,0,0,0,352,342,1,0,0,0,352, + 343,1,0,0,0,352,344,1,0,0,0,352,345,1,0,0,0,352,346,1,0,0,0,352, + 347,1,0,0,0,352,348,1,0,0,0,353,67,1,0,0,0,354,355,5,32,0,0,355, + 359,3,66,33,0,356,357,5,52,0,0,357,359,3,66,33,0,358,354,1,0,0,0, + 
358,356,1,0,0,0,359,69,1,0,0,0,360,361,7,3,0,0,361,71,1,0,0,0,362, + 367,3,74,37,0,363,364,5,37,0,0,364,366,3,74,37,0,365,363,1,0,0,0, + 366,369,1,0,0,0,367,365,1,0,0,0,367,368,1,0,0,0,368,73,1,0,0,0,369, + 367,1,0,0,0,370,375,3,76,38,0,371,372,5,38,0,0,372,374,3,76,38,0, + 373,371,1,0,0,0,374,377,1,0,0,0,375,373,1,0,0,0,375,376,1,0,0,0, + 376,75,1,0,0,0,377,375,1,0,0,0,378,383,3,78,39,0,379,380,7,4,0,0, + 380,382,3,78,39,0,381,379,1,0,0,0,382,385,1,0,0,0,383,381,1,0,0, + 0,383,384,1,0,0,0,384,77,1,0,0,0,385,383,1,0,0,0,386,391,3,80,40, + 0,387,388,7,2,0,0,388,390,3,80,40,0,389,387,1,0,0,0,390,393,1,0, + 0,0,391,389,1,0,0,0,391,392,1,0,0,0,392,79,1,0,0,0,393,391,1,0,0, + 0,394,399,3,82,41,0,395,396,7,5,0,0,396,398,3,82,41,0,397,395,1, + 0,0,0,398,401,1,0,0,0,399,397,1,0,0,0,399,400,1,0,0,0,400,81,1,0, + 0,0,401,399,1,0,0,0,402,407,3,62,31,0,403,404,7,6,0,0,404,406,3, + 62,31,0,405,403,1,0,0,0,406,409,1,0,0,0,407,405,1,0,0,0,407,408, + 1,0,0,0,408,83,1,0,0,0,409,407,1,0,0,0,410,413,3,80,40,0,411,413, + 3,82,41,0,412,410,1,0,0,0,412,411,1,0,0,0,413,85,1,0,0,0,40,89,97, + 106,124,130,136,144,146,149,156,168,172,201,209,215,225,228,234, + 238,243,250,260,275,280,295,305,316,319,322,330,336,352,358,367, + 375,383,391,399,407,412 + ] + +class CASSParser ( Parser ): + + grammarFileName = "CASS.g4" + + atn = ATNDeserializer().deserialize(serializedATN()) + + decisionsToDFA = [ DFA(ds, i) for i, ds in enumerate(atn.decisionToState) ] + + sharedContextCache = PredictionContextCache() + + literalNames = [ "", "'('", "')'", "'{'", "'}'", "'='", "';'", + "'for'", "'while'", "'if'", "'else'", "'switch'", "'case'", + "':'", "'['", "']'", "','", "'nullptr'", "'return'", + "'include'", "'int'", "'float'", "'double'", "'void'", + "'default'", "'break'", "'++'", "'--'", "'>'", "'<'", + "'<='", "'>='", "'&'", "'+='", "'-='", "'*='", "'/='", + "'||'", "'&&'", "'=='", "'!='", "'+'", "'-'", "'/'", + "'%'", "", "", "", "", + "", "", "", "'*'" ] + + symbolicNames = [ "", "", "", "", + "", 
"", "", "", + "", "", "", "", + "", "", "", "", + "", "", "", "", + "", "", "", "", + "", "", "", "", + "", "", "", "", + "", "", "", "", + "", "", "", "", + "", "", "", "", + "", "SL_COMMENT", "ML_COMMENT", "ID", "INT", + "BOOL", "FLOAT", "CHAR", "POINTER", "STRING", "WS" ] + + RULE_prog = 0 + RULE_functionDefinition = 1 + RULE_compoundStatement = 2 + RULE_statement = 3 + RULE_declarationStatement = 4 + RULE_forBlockStatement = 5 + RULE_forSingleStatement = 6 + RULE_conditionClause = 7 + RULE_whileBlockStatement = 8 + RULE_whileSingleStatement = 9 + RULE_ifBlockStatement = 10 + RULE_ifSingleStatement = 11 + RULE_elseClause = 12 + RULE_switchStatement = 13 + RULE_caseStatement = 14 + RULE_functionCall = 15 + RULE_arrayDeclarator = 16 + RULE_listInitializer = 17 + RULE_emptyInitializer = 18 + RULE_nullptr = 19 + RULE_argumentList = 20 + RULE_returnStatement = 21 + RULE_expressionStatement = 22 + RULE_includeStatement = 23 + RULE_parameterList = 24 + RULE_parameter = 25 + RULE_typeSpec = 26 + RULE_expression = 27 + RULE_defaultExpression = 28 + RULE_breakExpression = 29 + RULE_assignmentExpression = 30 + RULE_unaryExpression = 31 + RULE_comparingExpression = 32 + RULE_primaryExpression = 33 + RULE_pointerExpression = 34 + RULE_assignmentOperator = 35 + RULE_logicalOrExpression = 36 + RULE_logicalAndExpression = 37 + RULE_equalityExpression = 38 + RULE_relationalExpression = 39 + RULE_additiveExpression = 40 + RULE_multiplicativeExpression = 41 + RULE_operationExpression = 42 + + ruleNames = [ "prog", "functionDefinition", "compoundStatement", "statement", + "declarationStatement", "forBlockStatement", "forSingleStatement", + "conditionClause", "whileBlockStatement", "whileSingleStatement", + "ifBlockStatement", "ifSingleStatement", "elseClause", + "switchStatement", "caseStatement", "functionCall", "arrayDeclarator", + "listInitializer", "emptyInitializer", "nullptr", "argumentList", + "returnStatement", "expressionStatement", "includeStatement", + "parameterList", 
"parameter", "typeSpec", "expression", + "defaultExpression", "breakExpression", "assignmentExpression", + "unaryExpression", "comparingExpression", "primaryExpression", + "pointerExpression", "assignmentOperator", "logicalOrExpression", + "logicalAndExpression", "equalityExpression", "relationalExpression", + "additiveExpression", "multiplicativeExpression", "operationExpression" ] + + EOF = Token.EOF + T__0=1 + T__1=2 + T__2=3 + T__3=4 + T__4=5 + T__5=6 + T__6=7 + T__7=8 + T__8=9 + T__9=10 + T__10=11 + T__11=12 + T__12=13 + T__13=14 + T__14=15 + T__15=16 + T__16=17 + T__17=18 + T__18=19 + T__19=20 + T__20=21 + T__21=22 + T__22=23 + T__23=24 + T__24=25 + T__25=26 + T__26=27 + T__27=28 + T__28=29 + T__29=30 + T__30=31 + T__31=32 + T__32=33 + T__33=34 + T__34=35 + T__35=36 + T__36=37 + T__37=38 + T__38=39 + T__39=40 + T__40=41 + T__41=42 + T__42=43 + T__43=44 + SL_COMMENT=45 + ML_COMMENT=46 + ID=47 + INT=48 + BOOL=49 + FLOAT=50 + CHAR=51 + POINTER=52 + STRING=53 + WS=54 + + def __init__(self, input:TokenStream, output:TextIO = sys.stdout): + super().__init__(input, output) + self.checkVersion("4.13.2") + self._interp = ParserATNSimulator(self, self.atn, self.decisionsToDFA, self.sharedContextCache) + self._predicates = None + + + + + class ProgContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def EOF(self): + return self.getToken(CASSParser.EOF, 0) + + def statement(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.StatementContext) + else: + return self.getTypedRuleContext(CASSParser.StatementContext,i) + + + def getRuleIndex(self): + return CASSParser.RULE_prog + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterProg" ): + listener.enterProg(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitProg" ): + 
listener.exitProg(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitProg" ): + return visitor.visitProg(self) + else: + return visitor.visitChildren(self) + + + + + def prog(self): + + localctx = CASSParser.ProgContext(self, self._ctx, self.state) + self.enterRule(localctx, 0, self.RULE_prog) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 87 + self._errHandler.sync(self) + _la = self._input.LA(1) + while True: + self.state = 86 + self.statement() + self.state = 89 + self._errHandler.sync(self) + _la = self._input.LA(1) + if not ((((_la) & ~0x3f) == 0 and ((1 << _la) & 17873665550719882) != 0)): + break + + self.state = 91 + self.match(CASSParser.EOF) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class FunctionDefinitionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def typeSpec(self): + return self.getTypedRuleContext(CASSParser.TypeSpecContext,0) + + + def primaryExpression(self): + return self.getTypedRuleContext(CASSParser.PrimaryExpressionContext,0) + + + def compoundStatement(self): + return self.getTypedRuleContext(CASSParser.CompoundStatementContext,0) + + + def parameterList(self): + return self.getTypedRuleContext(CASSParser.ParameterListContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_functionDefinition + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterFunctionDefinition" ): + listener.enterFunctionDefinition(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitFunctionDefinition" ): + listener.exitFunctionDefinition(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, 
"visitFunctionDefinition" ): + return visitor.visitFunctionDefinition(self) + else: + return visitor.visitChildren(self) + + + + + def functionDefinition(self): + + localctx = CASSParser.FunctionDefinitionContext(self, self._ctx, self.state) + self.enterRule(localctx, 2, self.RULE_functionDefinition) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 93 + self.typeSpec() + self.state = 94 + self.primaryExpression() + self.state = 95 + self.match(CASSParser.T__0) + self.state = 97 + self._errHandler.sync(self) + _la = self._input.LA(1) + if (((_la) & ~0x3f) == 0 and ((1 << _la) & 15728640) != 0): + self.state = 96 + self.parameterList() + + + self.state = 99 + self.match(CASSParser.T__1) + self.state = 100 + self.compoundStatement() + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class CompoundStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def statement(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.StatementContext) + else: + return self.getTypedRuleContext(CASSParser.StatementContext,i) + + + def getRuleIndex(self): + return CASSParser.RULE_compoundStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterCompoundStatement" ): + listener.enterCompoundStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitCompoundStatement" ): + listener.exitCompoundStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitCompoundStatement" ): + return visitor.visitCompoundStatement(self) + else: + return visitor.visitChildren(self) + + + + + def compoundStatement(self): + + localctx = 
CASSParser.CompoundStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 4, self.RULE_compoundStatement) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 102 + self.match(CASSParser.T__2) + self.state = 106 + self._errHandler.sync(self) + _la = self._input.LA(1) + while (((_la) & ~0x3f) == 0 and ((1 << _la) & 17873665550719882) != 0): + self.state = 103 + self.statement() + self.state = 108 + self._errHandler.sync(self) + _la = self._input.LA(1) + + self.state = 109 + self.match(CASSParser.T__3) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class StatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def declarationStatement(self): + return self.getTypedRuleContext(CASSParser.DeclarationStatementContext,0) + + + def forBlockStatement(self): + return self.getTypedRuleContext(CASSParser.ForBlockStatementContext,0) + + + def forSingleStatement(self): + return self.getTypedRuleContext(CASSParser.ForSingleStatementContext,0) + + + def whileBlockStatement(self): + return self.getTypedRuleContext(CASSParser.WhileBlockStatementContext,0) + + + def whileSingleStatement(self): + return self.getTypedRuleContext(CASSParser.WhileSingleStatementContext,0) + + + def ifBlockStatement(self): + return self.getTypedRuleContext(CASSParser.IfBlockStatementContext,0) + + + def ifSingleStatement(self): + return self.getTypedRuleContext(CASSParser.IfSingleStatementContext,0) + + + def returnStatement(self): + return self.getTypedRuleContext(CASSParser.ReturnStatementContext,0) + + + def switchStatement(self): + return self.getTypedRuleContext(CASSParser.SwitchStatementContext,0) + + + def caseStatement(self): + return 
self.getTypedRuleContext(CASSParser.CaseStatementContext,0) + + + def expressionStatement(self): + return self.getTypedRuleContext(CASSParser.ExpressionStatementContext,0) + + + def functionDefinition(self): + return self.getTypedRuleContext(CASSParser.FunctionDefinitionContext,0) + + + def includeStatement(self): + return self.getTypedRuleContext(CASSParser.IncludeStatementContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_statement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterStatement" ): + listener.enterStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitStatement" ): + listener.exitStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitStatement" ): + return visitor.visitStatement(self) + else: + return visitor.visitChildren(self) + + + + + def statement(self): + + localctx = CASSParser.StatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 6, self.RULE_statement) + try: + self.state = 124 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,3,self._ctx) + if la_ == 1: + self.enterOuterAlt(localctx, 1) + self.state = 111 + self.declarationStatement() + pass + + elif la_ == 2: + self.enterOuterAlt(localctx, 2) + self.state = 112 + self.forBlockStatement() + pass + + elif la_ == 3: + self.enterOuterAlt(localctx, 3) + self.state = 113 + self.forSingleStatement() + pass + + elif la_ == 4: + self.enterOuterAlt(localctx, 4) + self.state = 114 + self.whileBlockStatement() + pass + + elif la_ == 5: + self.enterOuterAlt(localctx, 5) + self.state = 115 + self.whileSingleStatement() + pass + + elif la_ == 6: + self.enterOuterAlt(localctx, 6) + self.state = 116 + self.ifBlockStatement() + pass + + elif la_ == 7: + self.enterOuterAlt(localctx, 7) + self.state = 117 + self.ifSingleStatement() + pass + + elif la_ == 8: + self.enterOuterAlt(localctx, 8) + self.state = 118 + self.returnStatement() + 
pass + + elif la_ == 9: + self.enterOuterAlt(localctx, 9) + self.state = 119 + self.switchStatement() + pass + + elif la_ == 10: + self.enterOuterAlt(localctx, 10) + self.state = 120 + self.caseStatement() + pass + + elif la_ == 11: + self.enterOuterAlt(localctx, 11) + self.state = 121 + self.expressionStatement() + pass + + elif la_ == 12: + self.enterOuterAlt(localctx, 12) + self.state = 122 + self.functionDefinition() + pass + + elif la_ == 13: + self.enterOuterAlt(localctx, 13) + self.state = 123 + self.includeStatement() + pass + + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class DeclarationStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def typeSpec(self): + return self.getTypedRuleContext(CASSParser.TypeSpecContext,0) + + + def primaryExpression(self): + return self.getTypedRuleContext(CASSParser.PrimaryExpressionContext,0) + + + def arrayDeclarator(self): + return self.getTypedRuleContext(CASSParser.ArrayDeclaratorContext,0) + + + def POINTER(self, i:int=None): + if i is None: + return self.getTokens(CASSParser.POINTER) + else: + return self.getToken(CASSParser.POINTER, i) + + def expression(self): + return self.getTypedRuleContext(CASSParser.ExpressionContext,0) + + + def nullptr(self): + return self.getTypedRuleContext(CASSParser.NullptrContext,0) + + + def emptyInitializer(self): + return self.getTypedRuleContext(CASSParser.EmptyInitializerContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_declarationStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterDeclarationStatement" ): + listener.enterDeclarationStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( 
listener, "exitDeclarationStatement" ): + listener.exitDeclarationStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitDeclarationStatement" ): + return visitor.visitDeclarationStatement(self) + else: + return visitor.visitChildren(self) + + + + + def declarationStatement(self): + + localctx = CASSParser.DeclarationStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 8, self.RULE_declarationStatement) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 126 + self.typeSpec() + self.state = 130 + self._errHandler.sync(self) + _alt = self._interp.adaptivePredict(self._input,4,self._ctx) + while _alt!=2 and _alt!=ATN.INVALID_ALT_NUMBER: + if _alt==1: + self.state = 127 + self.match(CASSParser.POINTER) + self.state = 132 + self._errHandler.sync(self) + _alt = self._interp.adaptivePredict(self._input,4,self._ctx) + + self.state = 136 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,5,self._ctx) + if la_ == 1: + self.state = 133 + self.primaryExpression() + pass + + elif la_ == 2: + pass + + elif la_ == 3: + self.state = 135 + self.arrayDeclarator() + pass + + + self.state = 146 + self._errHandler.sync(self) + _la = self._input.LA(1) + if _la==5: + self.state = 138 + self.match(CASSParser.T__4) + self.state = 144 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,6,self._ctx) + if la_ == 1: + self.state = 139 + self.expression() + pass + + elif la_ == 2: + pass + + elif la_ == 3: + self.state = 141 + self.nullptr() + pass + + elif la_ == 4: + pass + + elif la_ == 5: + self.state = 143 + self.emptyInitializer() + pass + + + + + self.state = 149 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,8,self._ctx) + if la_ == 1: + self.state = 148 + self.match(CASSParser.T__5) + + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + 
self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ForBlockStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def logicalOrExpression(self): + return self.getTypedRuleContext(CASSParser.LogicalOrExpressionContext,0) + + + def unaryExpression(self): + return self.getTypedRuleContext(CASSParser.UnaryExpressionContext,0) + + + def compoundStatement(self): + return self.getTypedRuleContext(CASSParser.CompoundStatementContext,0) + + + def declarationStatement(self): + return self.getTypedRuleContext(CASSParser.DeclarationStatementContext,0) + + + def assignmentExpression(self): + return self.getTypedRuleContext(CASSParser.AssignmentExpressionContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_forBlockStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterForBlockStatement" ): + listener.enterForBlockStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitForBlockStatement" ): + listener.exitForBlockStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitForBlockStatement" ): + return visitor.visitForBlockStatement(self) + else: + return visitor.visitChildren(self) + + + + + def forBlockStatement(self): + + localctx = CASSParser.ForBlockStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 10, self.RULE_forBlockStatement) + try: + self.enterOuterAlt(localctx, 1) + self.state = 151 + self.match(CASSParser.T__6) + self.state = 152 + self.match(CASSParser.T__0) + self.state = 156 + self._errHandler.sync(self) + token = self._input.LA(1) + if token in [20, 21, 22, 23]: + self.state = 153 + self.declarationStatement() + pass + elif token in [6]: + pass + elif token in [1, 3, 26, 27, 32, 47, 48, 49, 50, 51, 52, 53]: + self.state 
= 155 + self.assignmentExpression() + pass + else: + raise NoViableAltException(self) + + self.state = 158 + self.match(CASSParser.T__5) + self.state = 159 + self.logicalOrExpression() + self.state = 160 + self.match(CASSParser.T__5) + self.state = 161 + self.unaryExpression(0) + self.state = 162 + self.match(CASSParser.T__1) + self.state = 163 + self.compoundStatement() + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ForSingleStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def logicalOrExpression(self): + return self.getTypedRuleContext(CASSParser.LogicalOrExpressionContext,0) + + + def unaryExpression(self): + return self.getTypedRuleContext(CASSParser.UnaryExpressionContext,0) + + + def statement(self): + return self.getTypedRuleContext(CASSParser.StatementContext,0) + + + def assignmentExpression(self): + return self.getTypedRuleContext(CASSParser.AssignmentExpressionContext,0) + + + def declarationStatement(self): + return self.getTypedRuleContext(CASSParser.DeclarationStatementContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_forSingleStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterForSingleStatement" ): + listener.enterForSingleStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitForSingleStatement" ): + listener.exitForSingleStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitForSingleStatement" ): + return visitor.visitForSingleStatement(self) + else: + return visitor.visitChildren(self) + + + + + def forSingleStatement(self): + + localctx = CASSParser.ForSingleStatementContext(self, self._ctx, 
self.state) + self.enterRule(localctx, 12, self.RULE_forSingleStatement) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 165 + self.match(CASSParser.T__6) + self.state = 166 + self.match(CASSParser.T__0) + self.state = 172 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,11,self._ctx) + if la_ == 1: + self.state = 168 + self._errHandler.sync(self) + _la = self._input.LA(1) + if (((_la) & ~0x3f) == 0 and ((1 << _la) & 15728640) != 0): + self.state = 167 + self.declarationStatement() + + + pass + + elif la_ == 2: + pass + + elif la_ == 3: + self.state = 171 + self.assignmentExpression() + pass + + + self.state = 174 + self.match(CASSParser.T__5) + self.state = 175 + self.logicalOrExpression() + self.state = 176 + self.match(CASSParser.T__5) + self.state = 177 + self.unaryExpression(0) + self.state = 178 + self.match(CASSParser.T__1) + self.state = 179 + self.statement() + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ConditionClauseContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def logicalOrExpression(self): + return self.getTypedRuleContext(CASSParser.LogicalOrExpressionContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_conditionClause + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterConditionClause" ): + listener.enterConditionClause(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitConditionClause" ): + listener.exitConditionClause(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitConditionClause" ): + return visitor.visitConditionClause(self) + else: + return 
visitor.visitChildren(self) + + + + + def conditionClause(self): + + localctx = CASSParser.ConditionClauseContext(self, self._ctx, self.state) + self.enterRule(localctx, 14, self.RULE_conditionClause) + try: + self.enterOuterAlt(localctx, 1) + self.state = 181 + self.logicalOrExpression() + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class WhileBlockStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def conditionClause(self): + return self.getTypedRuleContext(CASSParser.ConditionClauseContext,0) + + + def compoundStatement(self): + return self.getTypedRuleContext(CASSParser.CompoundStatementContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_whileBlockStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterWhileBlockStatement" ): + listener.enterWhileBlockStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitWhileBlockStatement" ): + listener.exitWhileBlockStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitWhileBlockStatement" ): + return visitor.visitWhileBlockStatement(self) + else: + return visitor.visitChildren(self) + + + + + def whileBlockStatement(self): + + localctx = CASSParser.WhileBlockStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 16, self.RULE_whileBlockStatement) + try: + self.enterOuterAlt(localctx, 1) + self.state = 183 + self.match(CASSParser.T__7) + self.state = 184 + self.match(CASSParser.T__0) + self.state = 185 + self.conditionClause() + self.state = 186 + self.match(CASSParser.T__1) + self.state = 187 + self.compoundStatement() + except RecognitionException as re: + 
localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class WhileSingleStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def conditionClause(self): + return self.getTypedRuleContext(CASSParser.ConditionClauseContext,0) + + + def statement(self): + return self.getTypedRuleContext(CASSParser.StatementContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_whileSingleStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterWhileSingleStatement" ): + listener.enterWhileSingleStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitWhileSingleStatement" ): + listener.exitWhileSingleStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitWhileSingleStatement" ): + return visitor.visitWhileSingleStatement(self) + else: + return visitor.visitChildren(self) + + + + + def whileSingleStatement(self): + + localctx = CASSParser.WhileSingleStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 18, self.RULE_whileSingleStatement) + try: + self.enterOuterAlt(localctx, 1) + self.state = 189 + self.match(CASSParser.T__7) + self.state = 190 + self.match(CASSParser.T__0) + self.state = 191 + self.conditionClause() + self.state = 192 + self.match(CASSParser.T__1) + self.state = 193 + self.statement() + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class IfBlockStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) 
+ self.parser = parser + + def conditionClause(self): + return self.getTypedRuleContext(CASSParser.ConditionClauseContext,0) + + + def compoundStatement(self): + return self.getTypedRuleContext(CASSParser.CompoundStatementContext,0) + + + def elseClause(self): + return self.getTypedRuleContext(CASSParser.ElseClauseContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_ifBlockStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterIfBlockStatement" ): + listener.enterIfBlockStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitIfBlockStatement" ): + listener.exitIfBlockStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitIfBlockStatement" ): + return visitor.visitIfBlockStatement(self) + else: + return visitor.visitChildren(self) + + + + + def ifBlockStatement(self): + + localctx = CASSParser.IfBlockStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 20, self.RULE_ifBlockStatement) + try: + self.enterOuterAlt(localctx, 1) + self.state = 195 + self.match(CASSParser.T__8) + self.state = 196 + self.match(CASSParser.T__0) + self.state = 197 + self.conditionClause() + self.state = 198 + self.match(CASSParser.T__1) + self.state = 199 + self.compoundStatement() + self.state = 201 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,12,self._ctx) + if la_ == 1: + self.state = 200 + self.elseClause() + + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class IfSingleStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def conditionClause(self): + return 
self.getTypedRuleContext(CASSParser.ConditionClauseContext,0) + + + def statement(self): + return self.getTypedRuleContext(CASSParser.StatementContext,0) + + + def elseClause(self): + return self.getTypedRuleContext(CASSParser.ElseClauseContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_ifSingleStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterIfSingleStatement" ): + listener.enterIfSingleStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitIfSingleStatement" ): + listener.exitIfSingleStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitIfSingleStatement" ): + return visitor.visitIfSingleStatement(self) + else: + return visitor.visitChildren(self) + + + + + def ifSingleStatement(self): + + localctx = CASSParser.IfSingleStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 22, self.RULE_ifSingleStatement) + try: + self.enterOuterAlt(localctx, 1) + self.state = 203 + self.match(CASSParser.T__8) + self.state = 204 + self.match(CASSParser.T__0) + self.state = 205 + self.conditionClause() + self.state = 206 + self.match(CASSParser.T__1) + self.state = 207 + self.statement() + self.state = 209 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,13,self._ctx) + if la_ == 1: + self.state = 208 + self.elseClause() + + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ElseClauseContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def compoundStatement(self): + return self.getTypedRuleContext(CASSParser.CompoundStatementContext,0) + + + def ifBlockStatement(self): + return 
self.getTypedRuleContext(CASSParser.IfBlockStatementContext,0) + + + def statement(self): + return self.getTypedRuleContext(CASSParser.StatementContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_elseClause + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterElseClause" ): + listener.enterElseClause(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitElseClause" ): + listener.exitElseClause(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitElseClause" ): + return visitor.visitElseClause(self) + else: + return visitor.visitChildren(self) + + + + + def elseClause(self): + + localctx = CASSParser.ElseClauseContext(self, self._ctx, self.state) + self.enterRule(localctx, 24, self.RULE_elseClause) + try: + self.enterOuterAlt(localctx, 1) + self.state = 211 + self.match(CASSParser.T__9) + self.state = 215 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,14,self._ctx) + if la_ == 1: + self.state = 212 + self.compoundStatement() + pass + + elif la_ == 2: + self.state = 213 + self.ifBlockStatement() + pass + + elif la_ == 3: + self.state = 214 + self.statement() + pass + + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class SwitchStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def conditionClause(self): + return self.getTypedRuleContext(CASSParser.ConditionClauseContext,0) + + + def compoundStatement(self): + return self.getTypedRuleContext(CASSParser.CompoundStatementContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_switchStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, 
"enterSwitchStatement" ): + listener.enterSwitchStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitSwitchStatement" ): + listener.exitSwitchStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitSwitchStatement" ): + return visitor.visitSwitchStatement(self) + else: + return visitor.visitChildren(self) + + + + + def switchStatement(self): + + localctx = CASSParser.SwitchStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 26, self.RULE_switchStatement) + try: + self.enterOuterAlt(localctx, 1) + self.state = 217 + self.match(CASSParser.T__10) + self.state = 218 + self.match(CASSParser.T__0) + self.state = 219 + self.conditionClause() + self.state = 220 + self.match(CASSParser.T__1) + self.state = 221 + self.compoundStatement() + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class CaseStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def defaultExpression(self): + return self.getTypedRuleContext(CASSParser.DefaultExpressionContext,0) + + + def primaryExpression(self): + return self.getTypedRuleContext(CASSParser.PrimaryExpressionContext,0) + + + def statement(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.StatementContext) + else: + return self.getTypedRuleContext(CASSParser.StatementContext,i) + + + def breakExpression(self): + return self.getTypedRuleContext(CASSParser.BreakExpressionContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_caseStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterCaseStatement" ): + listener.enterCaseStatement(self) + + def exitRule(self, 
listener:ParseTreeListener): + if hasattr( listener, "exitCaseStatement" ): + listener.exitCaseStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitCaseStatement" ): + return visitor.visitCaseStatement(self) + else: + return visitor.visitChildren(self) + + + + + def caseStatement(self): + + localctx = CASSParser.CaseStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 28, self.RULE_caseStatement) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 225 + self._errHandler.sync(self) + token = self._input.LA(1) + if token in [12]: + self.state = 223 + self.match(CASSParser.T__11) + pass + elif token in [24]: + self.state = 224 + self.defaultExpression() + pass + else: + raise NoViableAltException(self) + + self.state = 228 + self._errHandler.sync(self) + _la = self._input.LA(1) + if (((_la) & ~0x3f) == 0 and ((1 << _la) & 13370061393756162) != 0): + self.state = 227 + self.primaryExpression() + + + self.state = 230 + self.match(CASSParser.T__12) + self.state = 234 + self._errHandler.sync(self) + _alt = self._interp.adaptivePredict(self._input,17,self._ctx) + while _alt!=2 and _alt!=ATN.INVALID_ALT_NUMBER: + if _alt==1: + self.state = 231 + self.statement() + self.state = 236 + self._errHandler.sync(self) + _alt = self._interp.adaptivePredict(self._input,17,self._ctx) + + self.state = 238 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,18,self._ctx) + if la_ == 1: + self.state = 237 + self.breakExpression() + + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class FunctionCallContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def ID(self): + return 
self.getToken(CASSParser.ID, 0) + + def argumentList(self): + return self.getTypedRuleContext(CASSParser.ArgumentListContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_functionCall + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterFunctionCall" ): + listener.enterFunctionCall(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitFunctionCall" ): + listener.exitFunctionCall(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitFunctionCall" ): + return visitor.visitFunctionCall(self) + else: + return visitor.visitChildren(self) + + + + + def functionCall(self): + + localctx = CASSParser.FunctionCallContext(self, self._ctx, self.state) + self.enterRule(localctx, 30, self.RULE_functionCall) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 240 + self.match(CASSParser.ID) + self.state = 241 + self.match(CASSParser.T__0) + self.state = 243 + self._errHandler.sync(self) + _la = self._input.LA(1) + if (((_la) & ~0x3f) == 0 and ((1 << _la) & 17873665517420554) != 0): + self.state = 242 + self.argumentList() + + + self.state = 245 + self.match(CASSParser.T__1) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ArrayDeclaratorContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def primaryExpression(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.PrimaryExpressionContext) + else: + return self.getTypedRuleContext(CASSParser.PrimaryExpressionContext,i) + + + def getRuleIndex(self): + return CASSParser.RULE_arrayDeclarator + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, 
"enterArrayDeclarator" ): + listener.enterArrayDeclarator(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitArrayDeclarator" ): + listener.exitArrayDeclarator(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitArrayDeclarator" ): + return visitor.visitArrayDeclarator(self) + else: + return visitor.visitChildren(self) + + + + + def arrayDeclarator(self): + + localctx = CASSParser.ArrayDeclaratorContext(self, self._ctx, self.state) + self.enterRule(localctx, 32, self.RULE_arrayDeclarator) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 247 + self.primaryExpression() + self.state = 248 + self.match(CASSParser.T__13) + self.state = 250 + self._errHandler.sync(self) + _la = self._input.LA(1) + if (((_la) & ~0x3f) == 0 and ((1 << _la) & 13370061393756162) != 0): + self.state = 249 + self.primaryExpression() + + + self.state = 252 + self.match(CASSParser.T__14) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ListInitializerContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def primaryExpression(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.PrimaryExpressionContext) + else: + return self.getTypedRuleContext(CASSParser.PrimaryExpressionContext,i) + + + def getRuleIndex(self): + return CASSParser.RULE_listInitializer + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterListInitializer" ): + listener.enterListInitializer(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitListInitializer" ): + listener.exitListInitializer(self) + + def accept(self, visitor:ParseTreeVisitor): 
+ if hasattr( visitor, "visitListInitializer" ): + return visitor.visitListInitializer(self) + else: + return visitor.visitChildren(self) + + + + + def listInitializer(self): + + localctx = CASSParser.ListInitializerContext(self, self._ctx, self.state) + self.enterRule(localctx, 34, self.RULE_listInitializer) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 254 + self.match(CASSParser.T__2) + self.state = 255 + self.primaryExpression() + self.state = 260 + self._errHandler.sync(self) + _la = self._input.LA(1) + while _la==16: + self.state = 256 + self.match(CASSParser.T__15) + self.state = 257 + self.primaryExpression() + self.state = 262 + self._errHandler.sync(self) + _la = self._input.LA(1) + + self.state = 263 + self.match(CASSParser.T__3) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class EmptyInitializerContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + + def getRuleIndex(self): + return CASSParser.RULE_emptyInitializer + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterEmptyInitializer" ): + listener.enterEmptyInitializer(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitEmptyInitializer" ): + listener.exitEmptyInitializer(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitEmptyInitializer" ): + return visitor.visitEmptyInitializer(self) + else: + return visitor.visitChildren(self) + + + + + def emptyInitializer(self): + + localctx = CASSParser.EmptyInitializerContext(self, self._ctx, self.state) + self.enterRule(localctx, 36, self.RULE_emptyInitializer) + try: + self.enterOuterAlt(localctx, 1) + self.state = 265 + 
self.match(CASSParser.T__2) + self.state = 266 + self.match(CASSParser.T__3) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class NullptrContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + + def getRuleIndex(self): + return CASSParser.RULE_nullptr + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterNullptr" ): + listener.enterNullptr(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitNullptr" ): + listener.exitNullptr(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitNullptr" ): + return visitor.visitNullptr(self) + else: + return visitor.visitChildren(self) + + + + + def nullptr(self): + + localctx = CASSParser.NullptrContext(self, self._ctx, self.state) + self.enterRule(localctx, 38, self.RULE_nullptr) + try: + self.enterOuterAlt(localctx, 1) + self.state = 268 + self.match(CASSParser.T__16) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ArgumentListContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def expression(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.ExpressionContext) + else: + return self.getTypedRuleContext(CASSParser.ExpressionContext,i) + + + def getRuleIndex(self): + return CASSParser.RULE_argumentList + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterArgumentList" ): + 
listener.enterArgumentList(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitArgumentList" ): + listener.exitArgumentList(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitArgumentList" ): + return visitor.visitArgumentList(self) + else: + return visitor.visitChildren(self) + + + + + def argumentList(self): + + localctx = CASSParser.ArgumentListContext(self, self._ctx, self.state) + self.enterRule(localctx, 40, self.RULE_argumentList) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 270 + self.expression() + self.state = 275 + self._errHandler.sync(self) + _la = self._input.LA(1) + while _la==16: + self.state = 271 + self.match(CASSParser.T__15) + self.state = 272 + self.expression() + self.state = 277 + self._errHandler.sync(self) + _la = self._input.LA(1) + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ReturnStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def expression(self): + return self.getTypedRuleContext(CASSParser.ExpressionContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_returnStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterReturnStatement" ): + listener.enterReturnStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitReturnStatement" ): + listener.exitReturnStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitReturnStatement" ): + return visitor.visitReturnStatement(self) + else: + return visitor.visitChildren(self) + + + + + def returnStatement(self): + + localctx = 
CASSParser.ReturnStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 42, self.RULE_returnStatement) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 278 + self.match(CASSParser.T__17) + self.state = 280 + self._errHandler.sync(self) + _la = self._input.LA(1) + if (((_la) & ~0x3f) == 0 and ((1 << _la) & 17873665517420554) != 0): + self.state = 279 + self.expression() + + + self.state = 282 + self.match(CASSParser.T__5) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ExpressionStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def expression(self): + return self.getTypedRuleContext(CASSParser.ExpressionContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_expressionStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterExpressionStatement" ): + listener.enterExpressionStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitExpressionStatement" ): + listener.exitExpressionStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitExpressionStatement" ): + return visitor.visitExpressionStatement(self) + else: + return visitor.visitChildren(self) + + + + + def expressionStatement(self): + + localctx = CASSParser.ExpressionStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 44, self.RULE_expressionStatement) + try: + self.enterOuterAlt(localctx, 1) + self.state = 284 + self.expression() + self.state = 285 + self.match(CASSParser.T__5) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + 
self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class IncludeStatementContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def STRING(self): + return self.getToken(CASSParser.STRING, 0) + + def getRuleIndex(self): + return CASSParser.RULE_includeStatement + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterIncludeStatement" ): + listener.enterIncludeStatement(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitIncludeStatement" ): + listener.exitIncludeStatement(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitIncludeStatement" ): + return visitor.visitIncludeStatement(self) + else: + return visitor.visitChildren(self) + + + + + def includeStatement(self): + + localctx = CASSParser.IncludeStatementContext(self, self._ctx, self.state) + self.enterRule(localctx, 46, self.RULE_includeStatement) + try: + self.enterOuterAlt(localctx, 1) + self.state = 287 + self.match(CASSParser.T__18) + self.state = 288 + self.match(CASSParser.STRING) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ParameterListContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def parameter(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.ParameterContext) + else: + return self.getTypedRuleContext(CASSParser.ParameterContext,i) + + + def getRuleIndex(self): + return CASSParser.RULE_parameterList + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, 
"enterParameterList" ): + listener.enterParameterList(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitParameterList" ): + listener.exitParameterList(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitParameterList" ): + return visitor.visitParameterList(self) + else: + return visitor.visitChildren(self) + + + + + def parameterList(self): + + localctx = CASSParser.ParameterListContext(self, self._ctx, self.state) + self.enterRule(localctx, 48, self.RULE_parameterList) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 290 + self.parameter() + self.state = 295 + self._errHandler.sync(self) + _la = self._input.LA(1) + while _la==16: + self.state = 291 + self.match(CASSParser.T__15) + self.state = 292 + self.parameter() + self.state = 297 + self._errHandler.sync(self) + _la = self._input.LA(1) + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ParameterContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def typeSpec(self): + return self.getTypedRuleContext(CASSParser.TypeSpecContext,0) + + + def primaryExpression(self): + return self.getTypedRuleContext(CASSParser.PrimaryExpressionContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_parameter + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterParameter" ): + listener.enterParameter(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitParameter" ): + listener.exitParameter(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitParameter" ): + return visitor.visitParameter(self) + else: + return 
visitor.visitChildren(self) + + + + + def parameter(self): + + localctx = CASSParser.ParameterContext(self, self._ctx, self.state) + self.enterRule(localctx, 50, self.RULE_parameter) + try: + self.enterOuterAlt(localctx, 1) + self.state = 298 + self.typeSpec() + self.state = 299 + self.primaryExpression() + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class TypeSpecContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + + def getRuleIndex(self): + return CASSParser.RULE_typeSpec + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterTypeSpec" ): + listener.enterTypeSpec(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitTypeSpec" ): + listener.exitTypeSpec(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitTypeSpec" ): + return visitor.visitTypeSpec(self) + else: + return visitor.visitChildren(self) + + + + + def typeSpec(self): + + localctx = CASSParser.TypeSpecContext(self, self._ctx, self.state) + self.enterRule(localctx, 52, self.RULE_typeSpec) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 301 + _la = self._input.LA(1) + if not((((_la) & ~0x3f) == 0 and ((1 << _la) & 15728640) != 0)): + self._errHandler.recoverInline(self) + else: + self._errHandler.reportMatch(self) + self.consume() + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class ExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + 
super().__init__(parent, invokingState) + self.parser = parser + + def assignmentExpression(self): + return self.getTypedRuleContext(CASSParser.AssignmentExpressionContext,0) + + + def functionCall(self): + return self.getTypedRuleContext(CASSParser.FunctionCallContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_expression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterExpression" ): + listener.enterExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitExpression" ): + listener.exitExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitExpression" ): + return visitor.visitExpression(self) + else: + return visitor.visitChildren(self) + + + + + def expression(self): + + localctx = CASSParser.ExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 54, self.RULE_expression) + try: + self.state = 305 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,25,self._ctx) + if la_ == 1: + self.enterOuterAlt(localctx, 1) + self.state = 303 + self.assignmentExpression() + pass + + elif la_ == 2: + self.enterOuterAlt(localctx, 2) + self.state = 304 + self.functionCall() + pass + + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class DefaultExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + + def getRuleIndex(self): + return CASSParser.RULE_defaultExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterDefaultExpression" ): + listener.enterDefaultExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitDefaultExpression" ): 
+ listener.exitDefaultExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitDefaultExpression" ): + return visitor.visitDefaultExpression(self) + else: + return visitor.visitChildren(self) + + + + + def defaultExpression(self): + + localctx = CASSParser.DefaultExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 56, self.RULE_defaultExpression) + try: + self.enterOuterAlt(localctx, 1) + self.state = 307 + self.match(CASSParser.T__23) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class BreakExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + + def getRuleIndex(self): + return CASSParser.RULE_breakExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterBreakExpression" ): + listener.enterBreakExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitBreakExpression" ): + listener.exitBreakExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitBreakExpression" ): + return visitor.visitBreakExpression(self) + else: + return visitor.visitChildren(self) + + + + + def breakExpression(self): + + localctx = CASSParser.BreakExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 58, self.RULE_breakExpression) + try: + self.enterOuterAlt(localctx, 1) + self.state = 309 + self.match(CASSParser.T__24) + self.state = 310 + self.match(CASSParser.T__5) + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class 
AssignmentExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def unaryExpression(self): + return self.getTypedRuleContext(CASSParser.UnaryExpressionContext,0) + + + def assignmentOperator(self): + return self.getTypedRuleContext(CASSParser.AssignmentOperatorContext,0) + + + def assignmentExpression(self): + return self.getTypedRuleContext(CASSParser.AssignmentExpressionContext,0) + + + def nullptr(self): + return self.getTypedRuleContext(CASSParser.NullptrContext,0) + + + def emptyInitializer(self): + return self.getTypedRuleContext(CASSParser.EmptyInitializerContext,0) + + + def logicalOrExpression(self): + return self.getTypedRuleContext(CASSParser.LogicalOrExpressionContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_assignmentExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterAssignmentExpression" ): + listener.enterAssignmentExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitAssignmentExpression" ): + listener.exitAssignmentExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitAssignmentExpression" ): + return visitor.visitAssignmentExpression(self) + else: + return visitor.visitChildren(self) + + + + + def assignmentExpression(self): + + localctx = CASSParser.AssignmentExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 60, self.RULE_assignmentExpression) + try: + self.state = 322 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,28,self._ctx) + if la_ == 1: + self.enterOuterAlt(localctx, 1) + self.state = 312 + self.unaryExpression(0) + self.state = 313 + self.assignmentOperator() + self.state = 314 + self.assignmentExpression() + self.state = 316 + self._errHandler.sync(self) + la_ = 
self._interp.adaptivePredict(self._input,26,self._ctx) + if la_ == 1: + self.state = 315 + self.nullptr() + + + self.state = 319 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,27,self._ctx) + if la_ == 1: + self.state = 318 + self.emptyInitializer() + + + pass + + elif la_ == 2: + self.enterOuterAlt(localctx, 2) + self.state = 321 + self.logicalOrExpression() + pass + + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class UnaryExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def unaryExpression(self): + return self.getTypedRuleContext(CASSParser.UnaryExpressionContext,0) + + + def pointerExpression(self): + return self.getTypedRuleContext(CASSParser.PointerExpressionContext,0) + + + def primaryExpression(self): + return self.getTypedRuleContext(CASSParser.PrimaryExpressionContext,0) + + + def listInitializer(self): + return self.getTypedRuleContext(CASSParser.ListInitializerContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_unaryExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterUnaryExpression" ): + listener.enterUnaryExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitUnaryExpression" ): + listener.exitUnaryExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitUnaryExpression" ): + return visitor.visitUnaryExpression(self) + else: + return visitor.visitChildren(self) + + + + def unaryExpression(self, _p:int=0): + _parentctx = self._ctx + _parentState = self.state + localctx = CASSParser.UnaryExpressionContext(self, self._ctx, _parentState) + _prevctx = localctx + _startState = 62 + 
self.enterRecursionRule(localctx, 62, self.RULE_unaryExpression, _p) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 330 + self._errHandler.sync(self) + token = self._input.LA(1) + if token in [26, 27]: + self.state = 325 + _la = self._input.LA(1) + if not(_la==26 or _la==27): + self._errHandler.recoverInline(self) + else: + self._errHandler.reportMatch(self) + self.consume() + self.state = 326 + self.unaryExpression(5) + pass + elif token in [32, 52]: + self.state = 327 + self.pointerExpression() + pass + elif token in [1, 47, 48, 49, 50, 51, 53]: + self.state = 328 + self.primaryExpression() + pass + elif token in [3]: + self.state = 329 + self.listInitializer() + pass + else: + raise NoViableAltException(self) + + self._ctx.stop = self._input.LT(-1) + self.state = 336 + self._errHandler.sync(self) + _alt = self._interp.adaptivePredict(self._input,30,self._ctx) + while _alt!=2 and _alt!=ATN.INVALID_ALT_NUMBER: + if _alt==1: + if self._parseListeners is not None: + self.triggerExitRuleEvent() + _prevctx = localctx + localctx = CASSParser.UnaryExpressionContext(self, _parentctx, _parentState) + self.pushNewRecursionContext(localctx, _startState, self.RULE_unaryExpression) + self.state = 332 + if not self.precpred(self._ctx, 4): + from antlr4.error.Errors import FailedPredicateException + raise FailedPredicateException(self, "self.precpred(self._ctx, 4)") + self.state = 333 + _la = self._input.LA(1) + if not(_la==26 or _la==27): + self._errHandler.recoverInline(self) + else: + self._errHandler.reportMatch(self) + self.consume() + self.state = 338 + self._errHandler.sync(self) + _alt = self._interp.adaptivePredict(self._input,30,self._ctx) + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.unrollRecursionContexts(_parentctx) + return localctx + + + class ComparingExpressionContext(ParserRuleContext): + __slots__ = 'parser' 
+ + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + + def getRuleIndex(self): + return CASSParser.RULE_comparingExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterComparingExpression" ): + listener.enterComparingExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitComparingExpression" ): + listener.exitComparingExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitComparingExpression" ): + return visitor.visitComparingExpression(self) + else: + return visitor.visitChildren(self) + + + + + def comparingExpression(self): + + localctx = CASSParser.ComparingExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 64, self.RULE_comparingExpression) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 339 + _la = self._input.LA(1) + if not((((_la) & ~0x3f) == 0 and ((1 << _la) & 4026531840) != 0)): + self._errHandler.recoverInline(self) + else: + self._errHandler.reportMatch(self) + self.consume() + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class PrimaryExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def ID(self): + return self.getToken(CASSParser.ID, 0) + + def INT(self): + return self.getToken(CASSParser.INT, 0) + + def FLOAT(self): + return self.getToken(CASSParser.FLOAT, 0) + + def CHAR(self): + return self.getToken(CASSParser.CHAR, 0) + + def STRING(self): + return self.getToken(CASSParser.STRING, 0) + + def BOOL(self): + return self.getToken(CASSParser.BOOL, 0) + + def 
functionCall(self): + return self.getTypedRuleContext(CASSParser.FunctionCallContext,0) + + + def expression(self): + return self.getTypedRuleContext(CASSParser.ExpressionContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_primaryExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterPrimaryExpression" ): + listener.enterPrimaryExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitPrimaryExpression" ): + listener.exitPrimaryExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitPrimaryExpression" ): + return visitor.visitPrimaryExpression(self) + else: + return visitor.visitChildren(self) + + + + + def primaryExpression(self): + + localctx = CASSParser.PrimaryExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 66, self.RULE_primaryExpression) + try: + self.state = 352 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,31,self._ctx) + if la_ == 1: + self.enterOuterAlt(localctx, 1) + self.state = 341 + self.match(CASSParser.ID) + pass + + elif la_ == 2: + self.enterOuterAlt(localctx, 2) + self.state = 342 + self.match(CASSParser.INT) + pass + + elif la_ == 3: + self.enterOuterAlt(localctx, 3) + self.state = 343 + self.match(CASSParser.FLOAT) + pass + + elif la_ == 4: + self.enterOuterAlt(localctx, 4) + self.state = 344 + self.match(CASSParser.CHAR) + pass + + elif la_ == 5: + self.enterOuterAlt(localctx, 5) + self.state = 345 + self.match(CASSParser.STRING) + pass + + elif la_ == 6: + self.enterOuterAlt(localctx, 6) + self.state = 346 + self.match(CASSParser.BOOL) + pass + + elif la_ == 7: + self.enterOuterAlt(localctx, 7) + self.state = 347 + self.functionCall() + pass + + elif la_ == 8: + self.enterOuterAlt(localctx, 8) + self.state = 348 + self.match(CASSParser.T__0) + self.state = 349 + self.expression() + self.state = 350 + self.match(CASSParser.T__1) + pass + + + except 
RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class PointerExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def primaryExpression(self): + return self.getTypedRuleContext(CASSParser.PrimaryExpressionContext,0) + + + def POINTER(self): + return self.getToken(CASSParser.POINTER, 0) + + def getRuleIndex(self): + return CASSParser.RULE_pointerExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterPointerExpression" ): + listener.enterPointerExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitPointerExpression" ): + listener.exitPointerExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitPointerExpression" ): + return visitor.visitPointerExpression(self) + else: + return visitor.visitChildren(self) + + + + + def pointerExpression(self): + + localctx = CASSParser.PointerExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 68, self.RULE_pointerExpression) + try: + self.state = 358 + self._errHandler.sync(self) + token = self._input.LA(1) + if token in [32]: + self.enterOuterAlt(localctx, 1) + self.state = 354 + self.match(CASSParser.T__31) + self.state = 355 + self.primaryExpression() + pass + elif token in [52]: + self.enterOuterAlt(localctx, 2) + self.state = 356 + self.match(CASSParser.POINTER) + self.state = 357 + self.primaryExpression() + pass + else: + raise NoViableAltException(self) + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class 
AssignmentOperatorContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + + def getRuleIndex(self): + return CASSParser.RULE_assignmentOperator + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterAssignmentOperator" ): + listener.enterAssignmentOperator(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitAssignmentOperator" ): + listener.exitAssignmentOperator(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitAssignmentOperator" ): + return visitor.visitAssignmentOperator(self) + else: + return visitor.visitChildren(self) + + + + + def assignmentOperator(self): + + localctx = CASSParser.AssignmentOperatorContext(self, self._ctx, self.state) + self.enterRule(localctx, 70, self.RULE_assignmentOperator) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 360 + _la = self._input.LA(1) + if not((((_la) & ~0x3f) == 0 and ((1 << _la) & 128849018912) != 0)): + self._errHandler.recoverInline(self) + else: + self._errHandler.reportMatch(self) + self.consume() + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class LogicalOrExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def logicalAndExpression(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.LogicalAndExpressionContext) + else: + return self.getTypedRuleContext(CASSParser.LogicalAndExpressionContext,i) + + + def getRuleIndex(self): + return CASSParser.RULE_logicalOrExpression + + def enterRule(self, 
listener:ParseTreeListener): + if hasattr( listener, "enterLogicalOrExpression" ): + listener.enterLogicalOrExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitLogicalOrExpression" ): + listener.exitLogicalOrExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitLogicalOrExpression" ): + return visitor.visitLogicalOrExpression(self) + else: + return visitor.visitChildren(self) + + + + + def logicalOrExpression(self): + + localctx = CASSParser.LogicalOrExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 72, self.RULE_logicalOrExpression) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 362 + self.logicalAndExpression() + self.state = 367 + self._errHandler.sync(self) + _la = self._input.LA(1) + while _la==37: + self.state = 363 + self.match(CASSParser.T__36) + self.state = 364 + self.logicalAndExpression() + self.state = 369 + self._errHandler.sync(self) + _la = self._input.LA(1) + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class LogicalAndExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def equalityExpression(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.EqualityExpressionContext) + else: + return self.getTypedRuleContext(CASSParser.EqualityExpressionContext,i) + + + def getRuleIndex(self): + return CASSParser.RULE_logicalAndExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterLogicalAndExpression" ): + listener.enterLogicalAndExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, 
"exitLogicalAndExpression" ): + listener.exitLogicalAndExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitLogicalAndExpression" ): + return visitor.visitLogicalAndExpression(self) + else: + return visitor.visitChildren(self) + + + + + def logicalAndExpression(self): + + localctx = CASSParser.LogicalAndExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 74, self.RULE_logicalAndExpression) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 370 + self.equalityExpression() + self.state = 375 + self._errHandler.sync(self) + _la = self._input.LA(1) + while _la==38: + self.state = 371 + self.match(CASSParser.T__37) + self.state = 372 + self.equalityExpression() + self.state = 377 + self._errHandler.sync(self) + _la = self._input.LA(1) + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class EqualityExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def relationalExpression(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.RelationalExpressionContext) + else: + return self.getTypedRuleContext(CASSParser.RelationalExpressionContext,i) + + + def getRuleIndex(self): + return CASSParser.RULE_equalityExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterEqualityExpression" ): + listener.enterEqualityExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitEqualityExpression" ): + listener.exitEqualityExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitEqualityExpression" ): + return visitor.visitEqualityExpression(self) + else: 
+ return visitor.visitChildren(self) + + + + + def equalityExpression(self): + + localctx = CASSParser.EqualityExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 76, self.RULE_equalityExpression) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 378 + self.relationalExpression() + self.state = 383 + self._errHandler.sync(self) + _la = self._input.LA(1) + while _la==39 or _la==40: + self.state = 379 + _la = self._input.LA(1) + if not(_la==39 or _la==40): + self._errHandler.recoverInline(self) + else: + self._errHandler.reportMatch(self) + self.consume() + self.state = 380 + self.relationalExpression() + self.state = 385 + self._errHandler.sync(self) + _la = self._input.LA(1) + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class RelationalExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def additiveExpression(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.AdditiveExpressionContext) + else: + return self.getTypedRuleContext(CASSParser.AdditiveExpressionContext,i) + + + def getRuleIndex(self): + return CASSParser.RULE_relationalExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterRelationalExpression" ): + listener.enterRelationalExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitRelationalExpression" ): + listener.exitRelationalExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitRelationalExpression" ): + return visitor.visitRelationalExpression(self) + else: + return visitor.visitChildren(self) + + + + + def relationalExpression(self): + + 
localctx = CASSParser.RelationalExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 78, self.RULE_relationalExpression) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 386 + self.additiveExpression() + self.state = 391 + self._errHandler.sync(self) + _la = self._input.LA(1) + while (((_la) & ~0x3f) == 0 and ((1 << _la) & 4026531840) != 0): + self.state = 387 + _la = self._input.LA(1) + if not((((_la) & ~0x3f) == 0 and ((1 << _la) & 4026531840) != 0)): + self._errHandler.recoverInline(self) + else: + self._errHandler.reportMatch(self) + self.consume() + self.state = 388 + self.additiveExpression() + self.state = 393 + self._errHandler.sync(self) + _la = self._input.LA(1) + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class AdditiveExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def multiplicativeExpression(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.MultiplicativeExpressionContext) + else: + return self.getTypedRuleContext(CASSParser.MultiplicativeExpressionContext,i) + + + def getRuleIndex(self): + return CASSParser.RULE_additiveExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterAdditiveExpression" ): + listener.enterAdditiveExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitAdditiveExpression" ): + listener.exitAdditiveExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitAdditiveExpression" ): + return visitor.visitAdditiveExpression(self) + else: + return visitor.visitChildren(self) + + + + + def additiveExpression(self): + + 
localctx = CASSParser.AdditiveExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 80, self.RULE_additiveExpression) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 394 + self.multiplicativeExpression() + self.state = 399 + self._errHandler.sync(self) + _la = self._input.LA(1) + while _la==41 or _la==42: + self.state = 395 + _la = self._input.LA(1) + if not(_la==41 or _la==42): + self._errHandler.recoverInline(self) + else: + self._errHandler.reportMatch(self) + self.consume() + self.state = 396 + self.multiplicativeExpression() + self.state = 401 + self._errHandler.sync(self) + _la = self._input.LA(1) + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class MultiplicativeExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def unaryExpression(self, i:int=None): + if i is None: + return self.getTypedRuleContexts(CASSParser.UnaryExpressionContext) + else: + return self.getTypedRuleContext(CASSParser.UnaryExpressionContext,i) + + + def POINTER(self, i:int=None): + if i is None: + return self.getTokens(CASSParser.POINTER) + else: + return self.getToken(CASSParser.POINTER, i) + + def getRuleIndex(self): + return CASSParser.RULE_multiplicativeExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterMultiplicativeExpression" ): + listener.enterMultiplicativeExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitMultiplicativeExpression" ): + listener.exitMultiplicativeExpression(self) + + def accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitMultiplicativeExpression" ): + return 
visitor.visitMultiplicativeExpression(self) + else: + return visitor.visitChildren(self) + + + + + def multiplicativeExpression(self): + + localctx = CASSParser.MultiplicativeExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 82, self.RULE_multiplicativeExpression) + self._la = 0 # Token type + try: + self.enterOuterAlt(localctx, 1) + self.state = 402 + self.unaryExpression(0) + self.state = 407 + self._errHandler.sync(self) + _alt = self._interp.adaptivePredict(self._input,38,self._ctx) + while _alt!=2 and _alt!=ATN.INVALID_ALT_NUMBER: + if _alt==1: + self.state = 403 + _la = self._input.LA(1) + if not((((_la) & ~0x3f) == 0 and ((1 << _la) & 4529987906437120) != 0)): + self._errHandler.recoverInline(self) + else: + self._errHandler.reportMatch(self) + self.consume() + self.state = 404 + self.unaryExpression(0) + self.state = 409 + self._errHandler.sync(self) + _alt = self._interp.adaptivePredict(self._input,38,self._ctx) + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + class OperationExpressionContext(ParserRuleContext): + __slots__ = 'parser' + + def __init__(self, parser, parent:ParserRuleContext=None, invokingState:int=-1): + super().__init__(parent, invokingState) + self.parser = parser + + def additiveExpression(self): + return self.getTypedRuleContext(CASSParser.AdditiveExpressionContext,0) + + + def multiplicativeExpression(self): + return self.getTypedRuleContext(CASSParser.MultiplicativeExpressionContext,0) + + + def getRuleIndex(self): + return CASSParser.RULE_operationExpression + + def enterRule(self, listener:ParseTreeListener): + if hasattr( listener, "enterOperationExpression" ): + listener.enterOperationExpression(self) + + def exitRule(self, listener:ParseTreeListener): + if hasattr( listener, "exitOperationExpression" ): + listener.exitOperationExpression(self) + + def 
accept(self, visitor:ParseTreeVisitor): + if hasattr( visitor, "visitOperationExpression" ): + return visitor.visitOperationExpression(self) + else: + return visitor.visitChildren(self) + + + + + def operationExpression(self): + + localctx = CASSParser.OperationExpressionContext(self, self._ctx, self.state) + self.enterRule(localctx, 84, self.RULE_operationExpression) + try: + self.state = 412 + self._errHandler.sync(self) + la_ = self._interp.adaptivePredict(self._input,39,self._ctx) + if la_ == 1: + self.enterOuterAlt(localctx, 1) + self.state = 410 + self.additiveExpression() + pass + + elif la_ == 2: + self.enterOuterAlt(localctx, 2) + self.state = 411 + self.multiplicativeExpression() + pass + + + except RecognitionException as re: + localctx.exception = re + self._errHandler.reportError(self, re) + self._errHandler.recover(self, re) + finally: + self.exitRule() + return localctx + + + + def sempred(self, localctx:RuleContext, ruleIndex:int, predIndex:int): + if self._predicates == None: + self._predicates = dict() + self._predicates[31] = self.unaryExpression_sempred + pred = self._predicates.get(ruleIndex, None) + if pred is None: + raise Exception("No predicate with index:" + str(ruleIndex)) + else: + return pred(localctx, predIndex) + + def unaryExpression_sempred(self, localctx:UnaryExpressionContext, predIndex:int): + if predIndex == 0: + return self.precpred(self._ctx, 4) + + + + + diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSVisitor.py b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSVisitor.py new file mode 100644 index 00000000000..5c819a85b87 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/CASSVisitor.py @@ -0,0 +1,228 @@ +# Generated from CASS.g4 by ANTLR 4.13.2 +from antlr4 import * +if "." 
class CASSVisitor(ParseTreeVisitor):
    # Base visitor for parse trees produced by CASSParser. The file header
    # marks this module as generated from CASS.g4 by ANTLR 4.13.2.
    #
    # There is one visit<Rule> method per CASSParser context class. Every
    # default implementation simply returns self.visitChildren(ctx); override
    # the methods of interest in a subclass to give a rule custom handling.
    #
    # NOTE(review): as generator output, hand edits here would presumably be
    # lost when the grammar is regenerated — put custom logic in a subclass.

    # Visit a parse tree produced by CASSParser#prog.
    def visitProg(self, ctx:CASSParser.ProgContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#functionDefinition.
    def visitFunctionDefinition(self, ctx:CASSParser.FunctionDefinitionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#compoundStatement.
    def visitCompoundStatement(self, ctx:CASSParser.CompoundStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#statement.
    def visitStatement(self, ctx:CASSParser.StatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#declarationStatement.
    def visitDeclarationStatement(self, ctx:CASSParser.DeclarationStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#forBlockStatement.
    def visitForBlockStatement(self, ctx:CASSParser.ForBlockStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#forSingleStatement.
    def visitForSingleStatement(self, ctx:CASSParser.ForSingleStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#conditionClause.
    def visitConditionClause(self, ctx:CASSParser.ConditionClauseContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#whileBlockStatement.
    def visitWhileBlockStatement(self, ctx:CASSParser.WhileBlockStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#whileSingleStatement.
    def visitWhileSingleStatement(self, ctx:CASSParser.WhileSingleStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#ifBlockStatement.
    def visitIfBlockStatement(self, ctx:CASSParser.IfBlockStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#ifSingleStatement.
    def visitIfSingleStatement(self, ctx:CASSParser.IfSingleStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#elseClause.
    def visitElseClause(self, ctx:CASSParser.ElseClauseContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#switchStatement.
    def visitSwitchStatement(self, ctx:CASSParser.SwitchStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#caseStatement.
    def visitCaseStatement(self, ctx:CASSParser.CaseStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#functionCall.
    def visitFunctionCall(self, ctx:CASSParser.FunctionCallContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#arrayDeclarator.
    def visitArrayDeclarator(self, ctx:CASSParser.ArrayDeclaratorContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#listInitializer.
    def visitListInitializer(self, ctx:CASSParser.ListInitializerContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#emptyInitializer.
    def visitEmptyInitializer(self, ctx:CASSParser.EmptyInitializerContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#nullptr.
    def visitNullptr(self, ctx:CASSParser.NullptrContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#argumentList.
    def visitArgumentList(self, ctx:CASSParser.ArgumentListContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#returnStatement.
    def visitReturnStatement(self, ctx:CASSParser.ReturnStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#expressionStatement.
    def visitExpressionStatement(self, ctx:CASSParser.ExpressionStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#includeStatement.
    def visitIncludeStatement(self, ctx:CASSParser.IncludeStatementContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#parameterList.
    def visitParameterList(self, ctx:CASSParser.ParameterListContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#parameter.
    def visitParameter(self, ctx:CASSParser.ParameterContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#typeSpec.
    def visitTypeSpec(self, ctx:CASSParser.TypeSpecContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#expression.
    def visitExpression(self, ctx:CASSParser.ExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#defaultExpression.
    def visitDefaultExpression(self, ctx:CASSParser.DefaultExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#breakExpression.
    def visitBreakExpression(self, ctx:CASSParser.BreakExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#assignmentExpression.
    def visitAssignmentExpression(self, ctx:CASSParser.AssignmentExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#unaryExpression.
    def visitUnaryExpression(self, ctx:CASSParser.UnaryExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#comparingExpression.
    def visitComparingExpression(self, ctx:CASSParser.ComparingExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#primaryExpression.
    def visitPrimaryExpression(self, ctx:CASSParser.PrimaryExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#pointerExpression.
    def visitPointerExpression(self, ctx:CASSParser.PointerExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#assignmentOperator.
    def visitAssignmentOperator(self, ctx:CASSParser.AssignmentOperatorContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#logicalOrExpression.
    def visitLogicalOrExpression(self, ctx:CASSParser.LogicalOrExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#logicalAndExpression.
    def visitLogicalAndExpression(self, ctx:CASSParser.LogicalAndExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#equalityExpression.
    def visitEqualityExpression(self, ctx:CASSParser.EqualityExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#relationalExpression.
    def visitRelationalExpression(self, ctx:CASSParser.RelationalExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#additiveExpression.
    def visitAdditiveExpression(self, ctx:CASSParser.AdditiveExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#multiplicativeExpression.
    def visitMultiplicativeExpression(self, ctx:CASSParser.MultiplicativeExpressionContext):
        return self.visitChildren(ctx)


    # Visit a parse tree produced by CASSParser#operationExpression.
    def visitOperationExpression(self, ctx:CASSParser.OperationExpressionContext):
        return self.visitChildren(ctx)
def drive_tree():
    """Convert the file named in ``sys.argv[1]`` to CASS strings and render the tree.

    Steps:
      1. Lex and parse the input with ``CASSLexer`` / ``CASSParser`` (start
         rule ``prog``).
      2. Transform the parse tree into a CASS tree with ``MyCassVisitor``.
      3. For each child of the CASS root, assign usage links and record its
         node count (one pass; each child is counted exactly once).
      4. Print a list holding one record per entry of
         ``cass_root.to_cass_string()``: source range, node count and CASS
         body, separated by tab characters.
      5. Write the tree as DOT to ``cass.dot`` and render ``cass.png`` by
         running the ``dot`` executable.

    Exits with status 1 (usage message on stderr) when no input file is
    given. Because ``dot`` is run with ``check=True``, a non-zero exit from it
    raises ``subprocess.CalledProcessError``.
    """
    if len(sys.argv) < 2:
        # Name the script actually being run and the argument it expects.
        print(f"Usage: python {sys.argv[0]} <input_file>", file=sys.stderr)
        sys.exit(1)

    input_file = sys.argv[1]

    # 1) Lex & parse
    input_stream = FileStream(input_file)
    lexer = CASSLexer(input_stream)
    token_stream = CommonTokenStream(lexer)
    parser = CASSParser(token_stream)
    parse_tree = parser.prog()

    # 2) Transform to CASS
    visitor = MyCassVisitor()
    cass_root = visitor.visit(parse_tree)

    # 3) Link usages and count nodes, once per child. Links are assigned per
    #    child (not on the root) before the count is taken.
    node_counts = []
    for child in cass_root.children:
        assign_usage_links(child)
        node_counts.append(child.get_node_count())

    cass_strings = cass_root.to_cass_string()  # one entry per record to emit

    # 4) Build "<source range>\t<node count>\t<CASS body>" records.
    #    Indexing children/node_counts by position keeps the original
    #    behaviour of failing loudly if there are more strings than children.
    final_list = []
    for i, cas_body in enumerate(cass_strings):
        child = cass_root.children[i]
        src_range_str = child.get_source_range_string()
        final_list.append(f"{src_range_str}\t{node_counts[i]}\t{cas_body}")

    print(final_list)

    # 5) Create DOT & PNG
    dot_lines = cass_root.to_dot()
    with open("cass.dot", "w") as f:
        f.write("\n".join(dot_lines))

    subprocess.run(["dot", "-Tpng", "cass.dot", "-o", "cass.png"], check=True)
    print("PNG saved as cass.png")
"['0,0,7,1\\t32\\tS#FS#1_0\\tI#compound_statement#{$$$$$$$$$$$}\\t11\\tI#expression_statement#$;\\t1\\tI#assignment_expression#$=$\\t2\\tVx\\tVthis\\tI#expression_statement#$;\\t1\\tVcass\\tI#expression_statement#$;\\t1\\tVlogi\\tI#expression_statement#$;\\t1\\tVwas\\tI#expression_statement#$;\\t1\\tVvery\\tI#expression_statement#$;\\t1\\tVhard\\tI#expression_statement#$;\\t1\\tVto\\tI#expression_statement#$;\\t1\\tVimplement\\tI#declaration#int$;\\t1\\tI#init_declarator#$=$\\t2\\tvtotal\\t-1\\t29\\tN25\\tI#expression_statement#$;\\t1\\tI#assignment_expression#$=$\\t2\\tVstring\\tI#binary_expression#$+$\\t2\\tVx\\tvtotal\\t22\\t-1\\tI#return_statement#return$;\\t1\\tVstring\\t']\n", + "SourceRange(start_line=0, start_column=0, end_line=7, end_column=1) [-4.1294155 -5.211907 3.0889378 5.3393927 -5.6841416 1.2497337\n", + " 2.4063818 -9.08663 2.2093687 1.892722 -1.1380143 1.1616006\n", + " -1.5419241 -0.20270327 -0.07288193 -3.4492426 -4.0413427 4.779633\n", + " -5.629128 -2.9557533 1.4416361 -2.5284693 1.2146845 4.0458913\n", + " -6.9593687 -2.7513788 3.2649064 3.2515032 4.074086 1.6168451\n", + " -1.8603535 0.88812 -3.513892 2.5080686 0.5179828 -1.248848\n", + " 1.1560155 -1.6043649 11.595149 6.441434 3.0664783 1.519422\n", + " 4.947104 4.967602 1.9220064 5.642183 -1.0840368 -2.3155382\n", + " -5.74603 0.59510493 6.7324905 -2.9115293 0.1455935 -3.4160588\n", + " -1.2186348 3.7370958 1.1361692 -5.390905 -2.1138291 2.8961957\n", + " -4.516396 3.8821197 4.369601 -4.262406 -5.8198633 -0.6802757\n", + " 3.0132234 -5.479684 3.283188 -0.25578684 2.431601 0.3447537\n", + " 0.38510352 3.028669 -7.568852 0.02665816 -1.3509308 2.4025087\n", + " -1.6505597 -5.4847302 -0.71817356 -2.939468 -0.6101805 -3.626529\n", + " 5.250762 -3.6420784 -3.227295 5.315017 -3.6513247 -0.9761998\n", + " -3.9514906 -4.2916794 -3.4346824 1.8359088 4.747256 2.0808563\n", + " 2.9665325 2.0699759 3.323561 1.0676523 0.31472018 1.4222972\n", + " -0.6805499 3.637668 0.08404966 0.8734891 0.6308584 
-1.0322663\n", + " -6.1879883 -2.1322947 -2.051759 5.458273 -0.3508397 -0.430752\n", + " 1.4346448 4.4908223 -1.4062636 -5.8702455 -0.60570395 3.0688777\n", + " 7.723066 2.4687867 -2.4759264 -5.2423205 2.1638908 -3.9223175\n", + " -6.197274 -1.6294694 ]\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "line 2:8 token recognition error at: '''\n", + "line 2:14 missing ';' at 'cass'\n", + "line 2:19 missing ';' at 'logi'\n", + "line 2:24 missing ';' at 'was'\n", + "line 2:28 missing ';' at 'very'\n", + "line 2:33 missing ';' at 'hard'\n", + "line 2:38 missing ';' at 'to'\n", + "line 2:50 token recognition error at: '''\n", + "line 2:41 missing ';' at 'implement'\n", + "line 3:4 missing ';' at 'int'\n", + "line 5:4 missing ';' at 'return'\n", + "line 8:0 missing ';' at '}'\n" + ] + } + ], + "source": [ + "cass_manager = misim.CASSManager()\n", + "gnn_preprocessor = misim.GNNPreprocessor('MICSAS/data/datasets/poj/dataset-gnn/vocab.pkl')\n", + "gnn_runner = misim.GNNRunner('MICSAS/data/datasets/poj/dataset-gnn/vocab.pkl', 'MICSAS/data/models/poj/gnn/model.pt')\n", + "\n", + "# Compute GNN feature vectors for each function/loop in a source file.\n", + "cass_strs = drive_tree(input_file='test_codes/input_code_8.c')\n", + "#cass_strs = 
['1,0,10,1\\t34\\tS#FS#1_1\\tI#compound_statement#{$}\\t1\\tI#if_statement#if$$$\\t3\\tI#condition_clause#($)\\t1\\tI#binary_expression#$<$\\t2\\tvn\\t-1\\t15\\tN0\\tI#compound_statement#{$}\\t1\\tI#return_statement#return$;\\t1\\tN-1\\tI#else_clause#else$\\t1\\tI#if_statement#if$$$\\t3\\tI#condition_clause#($)\\t1\\tI#binary_expression#$||$\\t2\\tI#binary_expression#$==$\\t2\\tvn\\t5\\t18\\tN0\\tI#binary_expression#$==$\\t2\\tvn\\t15\\t27\\tN1\\tI#compound_statement#{$}\\t1\\tI#return_statement#return$;\\t1\\tN1\\tI#else_clause#else$\\t1\\tI#compound_statement#{$}\\t1\\tI#return_statement#return$;\\t1\\tI#binary_expression#$*$\\t2\\tvn\\t18\\t32\\tI#call_expression#$$\\t2\\tFfactorial\\tI#argument_list#($)\\t1\\tI#binary_expression#$-$\\t2\\tvn\\t27\\t-1\\tN1\\t']\n", + "#cass_strs = cass_manager.extract_cass_strs_from_src_file('input_code_ez.c', extract_loops=True)\n", + "casses, src_ranges = cass_manager.load_casses_from_strs(cass_strs)\n", + "inputs = gnn_preprocessor.preprocess_casses_seperated(casses)\n", + "vectors = gnn_runner.compute_code_vector_batched(inputs)\n", + "print (cass_strs)\n", + "for i in range(len(src_ranges)):\n", + " print(src_ranges[i], vectors[i])\n", + "\n" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Compute code similarity between two source files.\n" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "0.8808798\n" + ] + } + ], + "source": [ + "# Compute code similarity between two source files.\n", + "cass_strs_1 = drive_tree(input_file='test_codes/input_code_1.c')\n", + "cass_strs_2 = drive_tree(input_file='test_codes/input_code_2.c')\n", + "casses_1, _ = cass_manager.load_casses_from_strs(cass_strs_1)\n", + "casses_2, _ = cass_manager.load_casses_from_strs(cass_strs_2)\n", + "input_1 = gnn_preprocessor.preprocess_casses_combined(casses_1)\n", + "input_2 = 
gnn_preprocessor.preprocess_casses_combined(casses_2)\n", + "vectors = gnn_runner.compute_code_vector_batched([input_1, input_2])\n", + "from numpy.linalg import norm\n", + "similarity = (vectors[0] @ vectors[1].T) / (norm(vectors[0]) * norm(vectors[1]))\n", + "print(similarity)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import matplotlib.pyplot as plt\n", + "\n", + "# Paths to the two code files\n", + "file_1_path = \"test_codes/input_code_1.c\" # Update with your actual file path\n", + "file_2_path = \"test_codes/input_code_2.c\" # Update with your actual file path\n", + "\n", + "# Read the content of both files\n", + "with open(file_1_path, \"r\") as f1:\n", + " code_snippet_1 = f1.read()\n", + "\n", + "with open(file_2_path, \"r\") as f2:\n", + " code_snippet_2 = f2.read()\n", + "\n", + "# Create figure with 1 row, 3 columns (Two code snippets + Similarity bar)\n", + "fig, axes = plt.subplots(1, 3, figsize=(15, 5))\n", + "\n", + "# Display Code Snippet 1\n", + "axes[0].text(0, 1, code_snippet_1, fontsize=10, family='monospace', verticalalignment='top')\n", + "axes[0].axis(\"off\") # Hide axes\n", + "axes[0].set_title(\"Code Snippet 1\")\n", + "\n", + "# Display Code Snippet 2\n", + "axes[1].text(0, 1, code_snippet_2, fontsize=10, family='monospace', verticalalignment='top')\n", + "axes[1].axis(\"off\") # Hide axes\n", + "axes[1].set_title(\"Code Snippet 2\")\n", + "\n", + "# Plot Similarity Score\n", + "axes[2].bar([\"Code Similarity\"], [similarity], color='blue', alpha=0.7)\n", + "axes[2].set_ylim(0, 1)\n", + "axes[2].set_ylabel(\"Similarity Score\")\n", + "axes[2].set_title(\"Code Similarity\")\n", + "axes[2].grid(axis=\"y\", linestyle=\"--\", alpha=0.6)\n", + "\n", + "# Adjust layout to fit text properly\n", + "plt.tight_layout()\n", + "plt.show()\n" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "0.8952268\n" + ] + } + ], + "source": [ + "# Compute code similarity between two source files.\n", + "cass_strs_3 = drive_tree(input_file='test_codes/input_code_3.c')\n", + "cass_strs_4 = drive_tree(input_file='test_codes/input_code_4.c')\n", + "casses_3, _ = 
cass_manager.load_casses_from_strs(cass_strs_3)\n", + "casses_4, _ = cass_manager.load_casses_from_strs(cass_strs_4)\n", + "input_3 = gnn_preprocessor.preprocess_casses_combined(casses_3)\n", + "input_4 = gnn_preprocessor.preprocess_casses_combined(casses_4)\n", + "vectors = gnn_runner.compute_code_vector_batched([input_3, input_4])\n", + "from numpy.linalg import norm\n", + "similarity = (vectors[0] @ vectors[1].T) / (norm(vectors[0]) * norm(vectors[1]))\n", + "print(similarity)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAABdEAAAHqCAYAAADrpwd3AAAAOnRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjEwLjAsIGh0dHBzOi8vbWF0cGxvdGxpYi5vcmcvlHJYcgAAAAlwSFlzAAAPYQAAD2EBqD+naQAAe7FJREFUeJzt3QeYE1XXwPGzu/TeqwtI70U6vAgoChY6iog0EQtFFAHBAqK8WCgvSBelqKAUUQQVC0XpHRUUBKRL7yCwsJvvOddvYpLNLEk2u9ny/z1PIJlMZu5MdvfOnDlzbpjD4XAIAAAAAAAAAACIJTz2JAAAAAAAAAAAoAiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDXhQrVky6du0qSVmjRo3MAwAABA/HAAAApD6h6v9XrlwpYWFh5v9gmTlzplnmgQMHEvTYQZev69H1AakBQXQkK/v27ZOnnnpKihcvLhkyZJBs2bJJ/fr1Zdy4cXL16lVJqmJiYuTDDz+U2rVrS65cuSRr1qxSunRp6dy5s6xfv15SghEjRsgXX3zh8/yTJ0+Whx56SIoUKWI63qQesAAAhBbHACnjGODw4cMybNgwqVWrluTMmVPy5MljTup/+OGHBG8nACD5of9PXr7++mt57bXXQt0MIEGkSZjFAsH31VdfmaBr+vTpTcdTsWJFiYqKktWrV8uAAQNk586d8t5770lS9Oyzz8rEiROlZcuW0rFjR0mTJo3s3r1bvvnmG3MwUKdOHb+X+d1330lSO4Fu166dtGrVyqf53377bbl06ZI5iT527FiCtw8AkHxxDJByjgEWLVpkjgF03i5dusjNmzdNkOGee+6R6dOnS7du3RKlzQCApC819P933nmnuRiQLl26oK27U6dO8sgjj5j9lpCKFi1q2p42bVq3ILpuN4F0pEQE0ZEs7N+/33QC+kd6+fLlUrBgQed7vXr1kr1795oONik6ceKETJo0SXr06BGrgx87dqycOnUqoOUGs5MNhR9//NGZhZ4lS5ZQNwcAkERxDJCyjgEaN24shw4dMhnolqefflqqVq0qQ4YMIYgOAEhV/X94eLjJsA+miIgI80goegFcM+31eCTYbQeSMsq5IFl455135PLly/LBBx+4dZ6WkiVLSt++fd3+qL/xxhtSokQJc/VV65u99NJLcv36dbfPORwOGT58uNx2222SKVMmc2KnV7O9OX/+vDz33HMSGRlplqnr1Ewq7Txu1fnrevSWM08aQM6XL1+s2mVr1qyRfv36Sd68eSVz5szSunXrWCf
anjXNrFpqc+fONdtaoEAB89kWLVqYW6c9P6tX8bds2SL16tWTjBkzyu233y5TpkyJ1UbdZ0OHDjXbq9ut2z9w4EC3fanrvXLlisyaNcs896U8ix4M6XwAAMSFY4CUdQxQoUIFtwC60mXff//9cuTIEXOXGgAAqaX/91YT3eqrf/nlF2nYsKFpp657wYIFzoQ0LROjfXiZMmVilUTzVhPdk2b068Xr6tWrS/bs2c1xQ4MGDWTFihVe656PGjXKXACw9u9vv/0Wqya69v+ahW5tp/XQfaHfh2ble7p27ZpZv5bsAZI6MtGRLCxevNjc8qQne7544oknzMmc3lr8wgsvyIYNG+TNN9+U33//XT7//HPnfNppaAeqJ2762Lp1q9x7772mQ3H1999/m87r6NGj5o+7ZlCvXbtWBg8ebEqRaGcSV7BYzZ8/39yKph3grfTp08fUCdUTV+2YdPm9e/c2J8e38t///td0VC+++KKcPHnSfLZJkyayfft208lazp07Z7b54Ycflg4dOsi8efPkmWeeMVeTH3/8cTOPHhzoCbjeLvfkk09KuXLl5Ndff5X//e9/8scffzjrn3700Udmn2tpFp1PaecKAEB8cQyQOo4Bjh8/bvaPL/sIAJDypbb+35P21Q8++KDJxtdl6Jhi+nz27NkmsK93cT366KMycuRIs8160Vzrrvvq4sWL8v7775vjAM2Y14vYesGiadOmsnHjRnOHmKsZM2aYgLf29RpE1zrvnhcTdD/99ddf8v3335vjA4semzz22GPmwsjZs2fNZ12/Z22Lvg8keQ4gibtw4YJDf1Rbtmzp0/zbt2838z/xxBNu0/v372+mL1++3Lw+efKkI126dI4HHnjAERMT45zvpZdeMvN16dLFOe2NN95wZM6c2fHHH3+4LXPQoEGOiIgIx6FDh+JsU+fOnc0yc+bM6WjdurVj1KhRjt9//z3WfDNmzDDzNWnSxK1Nzz//vFnP+fPnndMaNmxoHpYVK1aYzxYuXNhx8eJF5/R58+aZ6ePGjXP7rE4bPXq0c9r169cdVatWdeTLl88RFRVlpn300UeO8PBwx6pVq9zaOWXKFPP5NWvWOKfp/nHdZ/6Iz2cBACkXxwAp/xhA7dmzx5EhQwZHp06dAl4GACDlSE39v9WH6/+effWcOXOc03bt2mWmad+8fv165/Rvv/3WTNfjCM9jiv3799seO9y8edP0/67OnTvnyJ8/v+Pxxx93TtNl6LKyZctm9p8r6z3Xdffq1ctM87R7924zffLkyW7TW7Ro4ShWrJjb9wEkVZRzQZKnVyWVr1dVdSALpbdCu9Kr0cqqm6a3POnVZs34ci0rold1PekVZL21STPDTp8+7Xxodld0dLT89NNPcbZJr9pOmDDB3C6tV8H79+9vMrruvvtuc2Xbk17ddW2TrlvXc/DgwVtuvw644rqv9Kq03v5m7ReLDmziesuUZp/pa81c01u8re3WdpYtW9Ztu++66y7zvuetXgAABBPHACn/GEAz/TTDTjPl33rrraAsEwCQvKXG/t+TjhummecWLduSI0cOswwt5WKxnv/555/iD62Zbo2xohnlmiGuJXFq1KhhsvM9tW3b1pSaC1Tp0qVNWzWT3qLr1IFWdeBVSr0iOaCcC5K8bNmymf99rZGpJ5k6OIfWDHOl9UG107FOQq3/S5Uq5TafdgzaUbras2ePqUdm12noSWdctD06+Ik+zpw5Y+qdau1R7TC0Y1y1apXb/HqrmCurPXpL1614bo92RrovPOuhFSpUyNQ98+zYlM6ro4Xrduvtb4FuNwAA8cExQMo+BtAghO4Drauq+0PbBQBAauz/PWnNds/AstYO1/rsntN8PU7wpOVvRo8eLbt27ZIbN244p2vg35O3af7Si/1aok6/By15oxcqdL2dOnWK97KBxEAQHcmiA9WTqh07dvj1uWBeydQrs/fcc48ZTMsb68TTF7lz5zY1RvWhA4booCBWJ2KxG0l
bB+RITLrdlSpVkjFjxnh937MDBwAgmDgGSNnHAFqDdcmSJSYrzcpwBwAgNfb/nuyOB4J1nPDxxx+bgUBbtWolAwYMMIOd6rK1jvy+fftize86tkqg9OLB888/b/p9HfRV26CZ75plDyQHBNGRLOiAGu+9956sW7dO6tatG+e82hFph6dXjvVWJ8uJEyfM6NpWR2X9r/PpgCWWU6dOxbqKqwNk6cjgeutWMGmHoR2oDkwSVwfqD90ez8507969UrlyZbfpOuDHlStX3DLRdKAwpSNnW9v9888/m1vObnVAwu1XAICEwDFAyjwG0BN2vdVdB2bTQc0AAHBF/5+wFixYYPbBwoUL3fpxHdg8PuI6JtABRR944AETRNcSLpqdH9cArUBSQ010JAt69VdP9HTEbe0IPemV0nHjxpnnOsK28vxjbGVS6R9tpZ1h2rRpZfz48W5Xbb39EX/44YdN5/3tt9/Gek87Za0dZuf48ePmNmVPWott2bJlXm87i48PP/zQ7bY37Ry1g77vvvvc5tM2T5061a09+lpvV6tevbpzu7Ve27Rp02Kt5+rVq+YE3KLfj+4LAACCiWOAlHcMMHLkSBk1apTJQuvbt6/f2wkASPno/xOWldHuuh82bNhgtjk+rAv0dscFWrpF941eTNc2uNZ9B5I6MtGRLOhV4Dlz5kj79u3NlWWtpVWxYkXTCa1du9bU0tJbkVSVKlWkS5cu5qq1/uFu2LChbNy40dT70luVGjdubObTE0Ud3ENvV9Kr3Nrxbtu2zdQoy5Mnj9v69Q/8l19+aebT9egJpp48/vrrr+YEVeuHen7GcuTIEalVq5a5TVmzubQum9ZP++STT0yGlw5iYvfZQOjV3f/85z/SrVs3c7ChBwTaQest06709ri3337btF1vRZs7d65s377d7Dc9sLA6uHnz5snTTz9tBhCrX7++qV+qNdN0uh5Q6JV0pftEB2rRAxVdttZMcx3wxNPixYvN9iutg6b15oYPH25e621unllzAIDUiWOAlHUMoIOraWBE69Hq96m3crvSW+fz588ftH0CAEie6P8Tlm6XZqG3bt3aXGTYv3+/qdlevnx5k4EfKOti/LPPPitNmzaNFSjXdWl5G/3+9CK/lpEBkg0HkIz88ccfjh49ejiKFSvmSJcunSNr1qyO+vXrO8aPH++4du2ac74bN244hg0b5rj99tsdadOmdURGRjoGDx7sNo+Kjo428xUsWNCRMWNGR6NGjRw7duxwFC1a1NGlSxe3eS9dumSWUbJkSbPuPHnyOOrVq+cYNWqUIyoqyrbNFy9edIwbN87RtGlTx2233Wbao+2uW7euY9q0aY6YmBjnvDNmzNDLwI5Nmza5LWPFihVmuv5vadiwoXl4zvPJJ5+YdubLl89s0wMPPOA4ePCg2/L0cxUqVHBs3rzZtCNDhgxmmydMmBCr/bptb7/9tpk/ffr0jpw5czqqV69u9tuFCxec8+3atctx5513mnVqOzz3nyd9X+fz9tD9AACAK44BUsYxwNChQ237f8/tBAAgpff/dv289r2etI3at3vSz/fq1SvWMcX+/fttjx20DSNGjDDL1D6+WrVqjiVLlph9oNMsugxd1siRI2Ot13rP9fz95s2bjj59+jjy5s3rCAsLM+976tmzp5k+Z84c230IJEVh+k+oA/kA4m/lypXmCrte0W3Xrl2c8+pgJqdPn/Z7oBYAAJD0cAwAAACSCx1c9IMPPjBlbzJlyhTq5gA+oyY6AAAAAAAAgAR17do1U8qtbdu2BNCR7FATHQAAAAAAAECC0JrwOn6K1pM/c+YMA4sjWSKIDgAAAAAAACBB/Pbbb9KxY0czkOi7774rVatWDXWTAL9REx0AAAAAgCTop59+kpEjR8qWLVvk2LFj8vnnn0urVq1uOU5Cv379ZOfOnRIZGSmvvPKKdO3aNdHaDABASkRNdAAAAAAAkqArV65IlSpVZOLEiT7Nv3//fnnggQfMYMP
bt2+X5557Tp544gn59ttvE7ytAACkZGSiAwAAAACQxIWFhd0yE/3FF1+Ur776Snbs2OGc9sgjj8j58+dl6dKlidRSAABSHmqiAwAAAACQAqxbt06aNGniNq1p06YmI93O9evXzcMSExMjZ8+eldy5c5vAPQAAKZnml1+6dEkKFSok4eHhwQ2if/HFF9K6dWuzEgROD0jmz58v7dq1k6Rgz549cuedd8off/whWbNmjfW+ZjzkyJFDZs6cGZL2pTZ6oKu3YGpNw5RAt6VatWrmFtNixYqZaadPn5by5cvL1q1b5bbbbgt42Tdv3pRu3bqZrBv9Gf3zzz+D2HIAFvr/4KD/R1zo/31H/w/Edvz4ccmfP7/bNH198eJFuXr1qmTMmDHWZ958800ZNmxYIrYSAICk5/Dhw3EemwYURL/vvvvMoCaB0pOw3r17y+XLlyUp0vbpAXnfvn1l7NixZpqeyGhduVOnTkmePHkkJRo8eLD06tXL6wm0tV/ik4nQqFEjqVixokyYMEESig6YoydmS5YsSbB1vPbaa7JgwQK3WyQTwhtvvCE3btxI0vsivvR3qXPnzjJ06FD54IMPAl6O/n5+/PHHsnDhQqlXr15Q2wjgX/T/9P+BoP/3D/2/7+j/geD1AzoQqeXChQtSpEgROXDggGTLls1M035As/M0S931Yro1PTo62m2ZdtN1mr7nbbrS5fsyPSIiwrTD23TPNtpNZ5vYJraJbWKb2CalF5o12cPufCheQfT06dNLgQIFJCXTHfrhhx/KiBEjJFOmTJLSHTp0SBYtWiT/+9//bOfRDB8knlv98qYUXbp0kZo1a8rIkSMlV65cAS3jr7/+Mn+XNEMWQMKh/0956P+THvp/39H/A7FpP33ixAm3afpag+HestCV/h7pw1POnDmdQXQAAFIqDc6rWyUO2Rd68WL16tVmgdbDWzaITv/kk0+kVKlSpsN96qmnnFcUrEwmzfLSUcat5WiGkr+3hTZs2NCcZOhBt9Z809vWLLo8zXTzbJdm5Sh9rtkv2j7N9mnQoIHJiHEdaEUPMHQUdN0WuyyfBx980Plar9Lrcjdv3mxe6xWMDh06mAOPZ599Vtq2bWtOQj2zbX7++WepVKmSZMiQQZo1axbrgEdv99bsLW1PhQoVZN68ebHaouudPn26GTAmS5YsZls+++wz857WtnvmmWfMwZS1DF2mJ12uricyMjLWezqau/Vd6XZ72xc6Anz//v0le/bsUrRoUbfsJ/0+9LM//vijGVXeWpa/t4VrBluJEiXMvtJ1vPzyy25t0GXOmjXL3NJrrUOzxiwfffSR1KhRw/zcaDv1NvqjR4+6rcP6WVm1apXJaNJ13X777eYWZF2Wvqe3Ou7cuTPOfRIfw4cPj/N3Q9uh39WoUaMkb9685rudNm2aX/vCFytWrJDatWubfaC/z+PHj3d7X5c5evRo+c9//iOZM2eWu+++22RqWvR3/NFHHzVBqOLFi8sPP/zgdT3681+wYEGTRRYo/RuTJg1DPAAJhf7/X/T/7vuC/j946P/9R/8PxFa3bl1ZtmyZ27Tvv//eTAcAAPHg8ENUVJTj2LFjjhkzZmh+fKz3V6xYYabfe++9jh07djjmz5/vCAsLcyxevNi8//fff5vPjx071pEpUybzXB9nzpzxpxmOihUrOtq2bevYvXu3Y+fOnY7x48c7Dh065Hy/YcOGjl69esVq16lTp8xrfT5mzBjHu+++a57PnTvXMXDgQEfTpk3N+7p9mTNndsybN89RvXp1r8vo0qWL44EHHnCuY//+/eb9TZs2mddFixZ1PP/8846FCxea6aNGjTLtLFOmjPMzOj1XrlyOr776yrF9+3azrnbt2jnfX758uWnHhx9+6Ni3b59jzpw5jgwZMjjWr1/vtj90OcWKFXO88847Zp8sW7bMPJSuN2/evI4ff/zR8eeffzqWLFni+Oyzz2Lt0xYtWjieeOIJr/v7woUL5ntq1qyZ2W5
POi1jxoyO//73v44//vjD0alTJ0f+/PkdN27cMO/r96ufr1u3rqNbt27O711/Hny1efNms50zZ850HDhwwLF69Wrz/VnOnz9vlvnwww87mjRp4lzHpUuXnPPovvjkk0/MPtq2bZujQYMGjrvuusttPdb3fMcdd5jvf+/evY7Zs2ebdeqydJkvvPCC+R6tdei6g+ny5ctmuT169DA/y56GDh1q9nfv3r3N/n7xxRcd6dOnd/5s+rIvbkX3kf6s6e+q7gP9Gc2dO7f5XbHofipevLjZZ/pzX7hwYbNvLPpcfw/WrFnjWLVqlfkZ1c/o74onbetjjz3mCNTkyZMdOXLkCPjzAOJG/0//T/9P/2+h/wcSl/4O698ufVj9mD4/ePCgeX/QoEHm769F/+ZrXztgwADH77//7pg4caIjIiLCsXTpUp/XqX//dV36PwAAKd0FH/s9v4Lols8//zzOk2g9YLZUrlzZMWTIELf5rJPUQGXJksUcDNjx5SRaDyj0oc+vXr3q+OabbxzlypVza58GDQoUKODYsGFDQCfRukxdtuv69OTHotP79+/vfP3tt986wsPDHWfPnjWvGzVqZA6KXD3yyCOOp556ym2aLqdz585e94WeaNWsWfOW+7RKlSqxvidPLVu2tD2JLlmypPP11q1bTZv0AC6u78UfCxYsMAd/t/qB9vxe4vLll1+aIM+1a9ec06zvefr06baf05PYChUqOBJa3759bU+i9efTarf+vGibNegS6L7w1LVrV/Oz5kp/Fq1Ak9J1vvHGG87Xzz77rOPOO+90vs6ZM6dj0qRJztf63O4kWgNO//nPfwJqqwZjHnzwQUedOnUC+jwA39H/0/+7ov9PGPT/vqH/R2ph/X3yfFh/l/V/z78Z+pmqVas60qVLZy56af/mD4LoAIDU5IKP/V6C3P9YsmRJ53O9nfns2bNBXb7envzcc8/J4sWLpU6dOvLQQw9J+fLl/VqG3qLq+lwfOlq5q7Rp05pbmSdPnmzqNvrLWq7r+jzXobflWvRWa70tVW8N1/32yy+/yLp169xuo42KivJ6i6/eku5Nx44dTW1XXY9+Tm+5bdWqVazb8bVdrvvEX3qbtUXbrvR711uhg0HbresoW7as3HPPPeYWYr193Z+6odu2bZMhQ4aYW+jPnTsnN2/eNIMO6G3HnjUA7fZnUqGjBVttdt3fwaI/e7/++qspD2DRQc70Nnpfftd1/+rD9fdSb9u24+33zxeTJk2SPn36SO7cuW1vFweQeOj/3Zfruj76/8DQ/7uj//8H/T9SE/0b7jmwmitvJbL0M/q3DwAABI9fNdF95VmbMK5OPxDvvPOOORHSOpxaw7Jq1aqmXqvF8wTRc5RXO97a+eSTT8qCBQvMCYGrQNfhC9dlax1LrQFrPX777TeZMWOGz4N+aZDh4MGDMnToUHPSqCfVPXv2jDWf1lH13EZ/eKtHGczvXbdPT+o0IKB1W3W/1K9f32yTL/RE+d577zX1ObX+qx5U6gmY3XeX1AdRS+j9rbSesevPntaB1XqKcbUj0DboybfWd/WX/jyvWbPG/Ey8+uqrAa0bQPDQ/8cP/X9s9P/u6P//Qf8PAACAxBaSkXjSpUvn88mPnXLlypmHDiCmGVw6gJJmJ1knQJcvX3bOe/jw4YDXowfnmgXleeKq69DBpuK7Dj0xcX2uI8LqoGRW5s6ff/7plu0TCG2rZuvpQwd4+t///mey61xVq1bNnKAn5e9dP6+DyOmjRYsWZtCrffv2SZkyZW65jl27dpmB5d5++23n/g10IKtg/Pwmhvi0U3/2du/eHfDPnmal6aB/+jOlgwCqHTt22M6v71nz+UMHiNNAkQ5W6O/AaQASH/3/v+j//fs8/b/v6P8BAACAEGeia7bI8ePH5fz58+a1PteH6wmrL/TA/Pr167Jo0SJzC6feouwrnbdXr17y448/mgyrL774wpzMut4qWr16dVm+fLlp78WLF2XKlCkSH5q
5pSfprnQdmzZtMrde67aMHTs2oGXryfk333xjMutefvlladu2rTMLSm891tvzRo0aJX/88YdZ3xtvvCEff/yxz8sfN26cfPrpp+bzug69Bd7bbbXNmjUzt457nnRFR0c7v2fdTv2+rNf6nr/f+08//SSHDh2Sa9eu+fX5r7/+2myLboOeOM+aNcucQBUpUiTWOrZs2WJOmnUd1vbofHr787Rp08zPi2YXTpw40a/2u65Dl7FhwwazDr3N2VPXrl1NRqH+fPjL2r9///23+Xm3XvvzexLXvvDF4MGDze/YoEGDzImw7nf9GdcAjK+0FIIGLfTnSrPFRo4caZslqO3Un8FA6W3nuo0AEgb9/7/o/+n/6f/jRv8PAAAASe1B9DZt2kjBggVN1ofS5/rQkzx/1KpVS55//nnp0aOHub1Wb7P1ucHh4ea2406dOknp0qXNcvTk89FHH3XOo9lpWgNUs64aN24srVu3lvjQGpy6LFcPP/ywqS2qt5LrCbVmRwVa33XAgAEmq0pvZ3Wtf3rXXXfJnDlzZPbs2ebEV29f37hxo1vmlS8nF3oio5lmujxdxwcffBBrvvvuu898F56362qGnfU9L1261NwKbb32N/tOt1NvG9cMwowZM8pHH33kV2bT559/bur7ValSxdyOrQEBXY4r/ZnSny996HvDhw8303W79cRbAwpap3PChAny+uuvSyD050mz+nSf6Tp0nd5ODLXOZyC3hVv7V0/49QTUer127Vq/lmO3L3yhP2P6fa9atcr8fOvvke5vf2oPawkBveVeMzkfe+wxr2UElAbTNDswPnVoNYMzmCUVALij//8X/T/9P/1/3Oj/AQAAkBKF6eiioW4EkoapU6fKZ599Jt99912om5LsFShQwNTrHD16dKibkuRpAKlv375ugTB/afBHg3E6IFpcA5gBAGKj/w8e+n/f0f8DSZfezaV3/Vy4cEGyZcsW6uYAAJAk+r0EGVgUyZPefquZXpcuXQp1U5I1rW2rt2LrLdGIm9ap1RIGHTp0iNdytJ6q1katXLmyyXQEAPiO/j846P99R/8PAACA5IZMdAAp6qRcAxietXIBAEDKRf8PBBeZ6ACA1OSij/1emkRtFQAkIK25CwAAUhf6fwAAACQ0yrkAAAAAAAAAAGCDIDoAAAAAAAAAACkxiF61alV57bXXQt0MAACQiOj/AQAAAACJKVkH0ZctWyb9+/cP+PPFihWTUaNGSWo3f/58KVWqlGTIkEHq1asnO3fuDHWTAACwRf8fHPT/AAAAAJAKgui5c+eWLFmyhLoZydovv/wiHTp0kO7du8uWLVskMjJSHnjgAbl+/XqomwYAgFf0//FH/w8AAAAAKTyI3qRJEwkLCzMPb7dzN2rUSHr06CFdunSRzJkzS9myZWXDhg1uGWj62YMHD8qAAQOcy1q5cqXPbXA4HPLqq6+ak07N4NJMrgkTJjjf12XpMk+fPu3Wrt69e5vn2u6GDRtK6dKlpVy5cjJu3DjJnj27OYGNjo6WxPL+++9LtWrVZNCgQVKhQgV577335OjRo/LNN9+4zadtOnLkiJw7dy7R2gYAgCv6/+Ch/wcAAACAFB5E19uPjx07Zk767HzyySfmpHXbtm3mRLdXr17O9zZt2mQ+f9ttt8mQIUPMc33orcy+WrhwobkVfPLkybJr1y6ZOnWq31lxerK6aNEiiYmJMdu0Zs0aWbt2rWmfL3T7dZ3eHqtWrfJpGZp9Vr9+fedrPZGvXLmybN682W2+w4cPm/34/PPP+7WNAAAEC/3/P+j/AQAAACBxpZFkKGfOnOb/NGnsm1+nTh3p1q2bed6zZ09p166d3Lx503wmb968ZnpERIRkzZpVChQo4HcbDhw4YNrRrFkzs0zNbvNXjRo1TBaaZoLp5ytWrChlypSRQ4cOmfbfytdffy03btzw+l7hwoV9asOpU6ckT548Jijw1FNPydatW81rnQ4AQFJC//8P+n8AAAAASFz
JMojui5IlSzqf68muZntduHDB1FENhtatW5tMNL0d++677za3Zj/88MOSLl06n5eht4Fb/7s+v3r1qk+fL1q0qARLtmzZzPLSp0/v9X09yddb2AEASMro//1D/w8AAAAAKbSciy+8ZakF8ySwePHism/fPlPLVE9A+/TpIy1btnS+r/VQPemJvC98bWcwbufWrDyt26p1ZvUW7nz58pnXVrYeAADJCf0//T8AAAAABFuKzUT3hWaN6S3egcqUKZM0b97cPGrXri3t27eXa9eumWyyHDlymHkuX75sbo+26opqvdFgCcbt3NWrVze1WC2arffLL7+YQdMAAEiJ6P/p/wEAAAAgRWeiR0VFyfHjx81DT4D1JNV6Hcgt3999952cPHnSnPz6mimmPvroI/nggw/kt99+MwOLzZ07V0qVKuW8LVufa4aaDhhmDXSmtU6DSW+/1m3w9siYMaNPy+jevbsZfO2tt96SnTt3ypNPPmlOwO+7775Y82p2nQ7WBgBAYqP//xf9PwAAAAAkrmQXRF+7dq0ULFjQPPSkb/To0c7X/ho+fLjJvCpSpIg56fzpp598/mz27Nll2rRpZgAwzUK7dOmSGZzLNUtt0qRJMnbsWClUqJCsW7dO6tevL0lNlSpVzAn++++/L3fccYfJlluyZEms2qgarFCB7GcAAOKL/j+46P8BAAAAwHdhDkaLgg/0xFprvm7fvl0qVaoU6uYAAIBEQP8PAKnPxYsXzUVjveCsd1cBAJCS+drvJbtMdITG999/L48++ign0AAApCL0/wAAAABAJjoAAAAAAPh/ZKIDAFKTi2SiAwAAAAAAAAAQPwTRAQAAAAAAAABIiUH0jz/+WIoUKSLh4eHSqFGjkLVj5syZcu+999q+nyNHDjNPKI0dO1aKFSsW0jakJl988YWEhYVJavLcc88l2O9hQi5bDRo0SPr06RPv5fzwww9Svnx5SZcuXch/54GUrGrVqvLaa6+FtA2p8e88AAAAAKRWybYm+s2bN01w+sUXX5Tu3btLhgwZJFeuXInejuvXr0vx4sVl7ty58p///MfrPCdPnpSsWbNKxowZA1qHnqTPnz9f2rVrF3A7//77b7ly5YrkzZtXkioNOvbu3VsuX76cYOtYuXKlNG7cWE6dOiV58uRJ0J+Lc+fOSYECBSS10ED39u3bzT4OtkuXLsmNGzcS7Hf89OnT5vdY26//B0r/Bujv+ZQpU6RQoUIB/84DiNuZM2ckffr0kiVLloA+rxeVtb/p379/iv47nxh93oEDB+T222+XTZs2SY0aNRJkHQCAxEVNdABAanIxpddEP378uAkKN2vWzASrQhFAVwsWLJDMmTPbBtBVvnz5Qh5My5QpU5IOoKc0GtxJyoGV5EYvQiXk77gGl+655x6ZPHlyvJbz119/yd133y0lSpQI+e88kJLlzp074AB6sPB3HgAAAABSj2QXRNeMJ83MjoyMNK9r1aplXruWejh79qw88sgj5uqBPjp06GCyxTyzs/Rzq1atknr16plMds2k2r9/v1/t+eSTT+SBBx7w+l7JkiXNOvThrbSDZsK99NJL8uCDD5ogt2Zw7d271/m+9Vn10EMPOV/rPvCn5I31uVCWc1m+fLnZPiuY36JFC4mKijLv6b7R9nXr1s1cGLHa6/qdaoabBjk12KnBSf3O1q5dG2s9+rnp06eb718DLDr/Z5995vy+NSNPaRvs9olegTpy5IjJMvTX6tWrne0P1m3++/btM3dcjBgxQoIlOjpahg0bZn6PdD/deeed8vPPPzvf1+9Ep8+ePdvMowErz9IJ69evl8qVK5vfnfvvv1/Onz/vdV2aAan7MxDDhw/3+vPgSb/fW/186/txZcnrz6T+PsdHTEyMpEmTJl7LAGCvSZMmzr8J3sq56N+JHj16SJcuXcwF7rJly8qGDRvc/g7oZw8ePCgDBgxwLsufO2gS4u98IPTOmYYNGzovMuq+0QQD5Uufp31Ly5Y
tJX/+/ObveJUqVWTx4sWx1qOfefPNN03mvmZn6GP8+PHO4zE9dlI1a9a03Sd6N5z2A/o/AAAAACRHyS6IrgG9Y8eOycaNG83rpUuXmtcLFy50ztOrVy/ZsWOHqU+sj19//VWeffZZ2xIUzz//vOzcuVP++9//mvrq/tCTabvblzXIqG2L61aA999/35zwa5BYy1VobWaLflYfatq0ac7X1gUEX2gJGP3M66+/LoG47777TDDV20MDrL4GbNu2bSt169Z1fi/6XAOOqn379qaNWrddg+zWdrp+pydOnDAXG6zv84477jCBWy3z4emNN96Q6tWry9atW2XevHmSM2dOE3TXZWpAXen3ra91v3saM2aM2cfr1q3ze3/Vrl3bLHfGjBkS33JF2la9cKBBIN1vGhzSiz5230eFChV8Xr7uozlz5phguQZi9E6Kpk2buu3Pa9euyVdffWX2uQarNOiu+17pBRD9TvV70M9rO/WCjTd6Acifn1lX+rup+1N/RxKaXpA7evSoCSwFSvdZ2rRpg9ouAP/S0mb6NyGuv3d6MUz/Xm7bts387dFjAov+zdfP33bbbTJkyBBnf6N9RGL9nX/66adt/477c7G0U6dOJji+ZcsWcyzSqlUrcxyhfOnztIyVBr717/xvv/1m+uLWrVt7TSaYNGmS6Z/1uObbb781+9XueMw6bnGlfbHOr/8DAAAAQHKU7FImIyIizO3TGqxSmiHreju1ZsPqSZoO+KVBMfXWW2+Zk8sJEyaYDCpXmlmlQT6lJRj8oevSejlaTsYbq/5oXJlqmv2qmWCqa9euJpBscd0urf8eyG3jml2mn9NMtUBokP/q1ate39PsNV/3kz40IG/Vm9aMN4tmlutDvxvdV962UwPorjQrbuLEiSbQ7Tmoq2ZVa4ahKl26tHO6LtcqCaIldhKiPqwGUHU9+n0F4tChQ/Lee+/JBx98YLIoNTtfA92FCxc27+t3oUFru3X7Qn933nnnHfn8889N6RGlgRtdjwZTNIvfuvih82mwqUyZMvLqq6/K5s2bpVKlSiZYogEY/XnVbdVA/6effirBpvtAHxq8SWjWPtbsSn//FqiffvrJjH+g+wJAwtCLoiquOz7q1Klj/naqnj17movJemFSP2OVNdNjCe0XA+lX4/t3Xi9q29Vi96dslf6teuaZZ5z9nA5qbNHBjW/V5+nFAH1Y9M640aNHy/fffy9PPvmk27zad2t/4Cmu4zEAAAAASEmSXRD9VjSDSjOcNdBn0YCtBgT1vapVq7rN36BBg4DXZQWXNVAdKC354hoc0FI0SYkVWIwPPbHWCxX60IC3Bjg0UFu0aFGfl6HByVdeeUVWrFhhstKtLHZvg5DG5ztVmnXtrUxAYtDMSM3wf/vtt00WtucFGL3Y4PozE4g9e/aYn902bdq4LV+n/fnnn271fjWAbtGAkfXzqdnaevHINYikv3Ou5YgsCTHQqNKsfL0wo/T3W8vvWDWS9WdLMy81W1XLNigtI6Dza/BMffPNN24/K9bvsd1Fo7ho4Eh/Lp966imT0Q8gdDz7Ve0v9IK39kVJgQa09RFfGkDXu+m0BIv2q9rHugbSb0XLp2lft2TJEpM9rhca9O9kQvSrmiSgDwAAAABIrpJdOZdgCzSTTOkJuQYhPeut+8Mzm87hcEhSEoxyLkrvDtBM3fr165vnFStW9BpwtaP1bfWWcc0+12xo6/ZxK5gerO801F5++WWTOanlVrRUyrvvvitnzpxxvh+sci5KAyea1W49du/ebcoMWLxleialn08to2S1Xe+Y0KC+9frrr7828+j/1jR9X+ezXnuWYbIuEAQyAK/+bI8bN86UXdKfTwChk9T/dgWrnItmhutYFjoui16s1CQBLeviK82G1/5Y79bTMi36d1GPa1JavwoAAAAAwZDiMtF1gCuta661m60BtPQkU6dZg18Fi94urVlfWktU63MnFL11XDPEQiEY5VwsWqdcH3379jWBymX
LlrllDOr+tNtODQzoQGZW6RYriO4vXYcK1f68lVKlSplgrAY15s6dK1OmTDGlabTsz8CBA52B4/iUc9F1aNa1Zh5ag875S7+3v/76y2R3WiWStG57fO7K8JdrVr4OWKeBM88sfde7HfR9vbPCLpNf26/70PUuFl9pOQV9aJkGDUbZjZMAIGmIq79JaMEq56LKlStnHlqaTi+kakkuHePClz5P+1Ute2OVlNNBSV0v2qaUfhUAAAAAgiHFZaJrtpTWPx08eLAJtOpDB+vU8iGe9dCDoVmzZiY72JMGnvWEVB+aAafBRn1+6tQpv9ehQT+9XVsz3rX2qD8Zdbo+Xa8OGKklL6w2+Vqywgo6env4Wmdd63zrd6D1y7W0xocffigXL16MFazUZWpJjkWLFpn26eCVFg1QalD5jz/+kDVr1ngtdeLPRZYFCxaYW9l1fZ60NrguW//3l2Yz6/7VGvDK2t/ebo+/VYBYb33XgKz+DOtFB80ctwLH3h6+lsfRQLcG5l944QUzSJ+WcNEsRi0NoIFkX3/utRyBXhDRDHYN/NtlYOt26P7U+r3+svaflhjQnwfrtevPRrBoNrmWLIhP/XXNJLXqAwMILte/ARqw1b+r1mt/6d/M7777zpQK099Zb9nXCfV3Xv922v0d9zWIrvtCB0z98ccfTb+q48BoyTrPfjWuPk/7VT220KQDHYi7c+fOAV0I1Qvq+rdPx9nQvt3b30DtY7QfCFWpNAAAAACIrxQXRFda8kMzxHXQRH1odpZmMSeEHj16mBNx62TaogHfggULmoeeVGrdUn1es2ZNv9ehgzfqCa6eeGsQ1arx7Atdn65Xa21rtq7VJm1fYtGgpAZatQa3DlA5cuRImTp1qtSrV89tPh0IVoPjuk/1M64Dhk6fPt0ELrS+/RNPPGG2RwMD/tJt13rjOjCpXgTQ9niyAiE6r790G/Vz1qB21v4eNWqUBEq3edKkSTJs2DAJlqFDh5qyMZrdrgNharkcDXz4WqdXM7Y1KKM/l9o+HWj0scce8zqv7k8NzARSDsDaf1omRS/CWK/Xrl3rNl+jRo1uGaTX93U+Ozowqv7sxYfWW/cnGAfAd/p7b/0N0DEPdBBM67W/hg8fbi5uFylSxPSrehEtlH/n/aX9n15Y79SpkwmGa9+p5cAeffRRn/u8MWPGmL/LOriobpP+DbcbKP1Wf/cmT55sSsNoDXrdn8HsVwEAAAAgKQhzJKVCoclUhw4dTPbXSy+9FOqmIAj0TgbNng+0ZAz+pX9eNEtRg/R68SSp0trpWl5BMzKtgUcDoTX/dTDWOXPmxGs5AJCSWPXX9W6yxCz7BQAIjCaB6V3cesE5W7ZsoW4OAABJot9LcTXRQ0GzvLQECZI/zSJevny5KXOC+NP67Vp2QMsrJWVaLmbGjBnxDnz36dNHHn/8cUmfPr3MmjVLOnbsGLQ2AkBy9f3335s7oAigA0Dq1bx5qFsAAEhJFi9O/HWSiQ4AQaQXDXTQVq1t7Ou4AQAAAEBKzkQniA4ASKpBdDLRASAE0qVL5/MgrwAAAAAAAEj6UuTAogAAAAAAAAAABANBdPisVatW0rVr11A3AwAArxo1aiS9e/e+5Xznz5+XsLAwWblypdt0fa3Trcfp06cloWm/OmLECNtxJbQdBw4ckNRi7NixUqxYMbdpS5culapVq5pxS+JDBw2/8847JXPmzNKtW7d4thQAAABAakI5F/hs5syZ5mQeAIDkTOvdWWMXuKpXr56ZvnbtWmnbtm2Ct+OXX36RxYsXy8GDB72+X7FiRdOevHnzSmrWrFkzeeWVV2T27NnSqVOngJfz3nvvyZ49e2T16tVSvHjxoLYRAAAAQMpGJjp8liNHDhN4AAAgOdMLwgUKFDBjGLjS1zrdM7ieUMaPHy9t2rSRLFmyeH0/TZo0pj0RERGS2nXp0kXefffdeC3jr7/+kipVqki1atU4ngEAAADgF4LoAXI4HPLqq69KZGSkZMi
QQUqVKiUTJkyIdUu4663grreZv/baa9KwYUMpXbq0lCtXTsaNG2dO6B544AGJjo72uz1667PnbenB8sQTTzhvbY+rnMupU6fkyJEjCdIGAEDq9cEHH0j58uW9vqelUBo3bux8ff36dRNw1ZIdZcuWlQ0bNsQKTFt9WqD95qRJk6RkyZKSKVMmqVGjhqxYscLvZWhfP3/+fHnwwQdjvad9qWtZmWCUc9GM9uHDh0vfvn0lmOLaF9ax0CeffGKOk3Sk+6eeesqtLMsff/xh7gDQYyn9X0uueNOiRQvZvHmz7N27N+C26nr1+wcAAAAAfxFED9DChQtl1KhRMnnyZNm1a5dMnTrVNpPMztGjR2XRokXmpE5PpNesWWNuId+0aVNQ2qiBBW2Tt8fTTz/t83LGjBljTr71duq4PPTQQ+aiAgAAwVS3bl3ZvXu3XL58OdZ72mfq+xYN2OpF623btpk+qVevXrH6Xl1WfEqbDRs2TEaPHi07duwwAXu9AG4X/I2rlMuFCxdM4NlToUKFTL/7ww8/SHwv+H/33Xcm271o0aLy/fffy7333mvaand84M+xjK/7Quf74osvZPr06TJt2jT5+uuvne917NjRBNe3bt0qzzzzjEyZMsXrurT9+fLlkx9//DHg/XHt2jVJmzZtwJ8HAAAAkHqRjhMgzQrLmTOnCSxrVpPnIFi+0BNnzULX24r181r7tEyZMubks06dOvFuowbKH374Ya/v6Qmrr3RefaRPnz7ebQIAwF/aV2o/tGXLFnMX1+OPPy7PPvusGWxSg+j62qL9pzVoZM+ePaVdu3Zy8+ZNZwZy/vz549WfadD49ddfl5YtW5rXffr0kTlz5pjHoEGDfF6O1kHXLO2CBQvGei88PNyUcTl+/HhAbdS74DR7X2uAX7161QS33377bZMNrnR/6KCl8eXrvtA79ypUqGAelSpVMt+ZZuDrhQTNLv/tt9/Md6x3GyxZsiTW3QOWwoULB5yVr6VcNFnhscceC3BrAQAAAKRmBNED1Lp1a5OJruVY7r77bnNSrwFrz/qqcdFbl63/XZ/rCa8v9GTUGozs77//lvvuu89ZN/Wbb76RBg0aJFpdV5VQ5WQAAKmbBptr165tAq6ajfzpp5/KbbfdZgLNmlnueuFZS4tY9GK33u2lGd+5c+eOdzsuXbpkgrjPPfecvPDCC24Zzhoc9of29ZoVrQHzYNPychrgHjBggLkrzbOEib523U8JvS88v5OzZ8+a5/v27TPHLZpAYNHP2gXR/TlGcvXII4/I3LlzpXr16vLyyy/7/XkAAAAAIIgeoOLFi5uTv2XLlpngsWZfzZ492wSvrRN+T641QG91+7Uv9HboGzdumOd667pmmWmQwcrW0hNnfXijmVh2t0wDAJDUaMkWzWDWLPLnn39eli9fLjVr1jQB2rx58zrn81bz2td+1VdaksTzjjF/7vBSefLkkaioKHMRXOuJB1OPHj1MtrmWT/n8889NZr5mo+uxgdI73uxqzCtvZXPisy88v5NAvw8Nvrt+17763//+J507d5ZHH33UtFd/fgAAAADAHwTR40FPeps3b24eGrxu3769ycDSTKkcOXI4T0T1RFkdPnxYKleuHLT1a31Q1xNUPTl2zfYKVjkXAACSQhD9o48+MgOHvvXWW6a+twbSXeuhB4tVF9wz6zlr1qym79UgdHzLgmgpGqWlTLzVRY8PPR7QQUR1EHMde0Uvmg8dOlSaNGki/fr1MwOxxrecSzD2hR6z6ACrWqNey7kora3ujX4Xmrxwxx13+L0eLZmjD91+LelCEB0AAACAvwiiB0hP5DWDTE/e9VZsvU1Ya41aZVn0uQaqdcBQvZ1aBzrzd9Cx+NJSLvEt56Int6dOnTLPNXChJ7FWjVbNBrPKx6iuXbvKrFmzZP/+/QHViAcAwI5erNb+RftZLf+hpdQmTpxo7sLylV7Y1sfFixedmc3ap2kpNtf+UpevgXTNWtbBLjNmzOi
8OD5kyBBTwkRrq+tdYCdOnDCDZuqAnRqk9ZX2oVpeZNWqVbGC6Fp+RvvbM2fOmNfaD+t2azuyZ8/u8zr0Anvbtm3NQwPQWiNdj0vuueeeeJdzCca+0NIttWrVMkFtHcRcA/tffvmlKdnjad26dWYf1K9fP+D26neq9eIBAAAAwF/BL8SZSuhJrHULs57Ya23QhQsXumWpT5o0ScaOHSuFChUyJ3/xOfG7Fa1LqiewwabZ81YG19KlS2XevHnO1/qeKw1MuGbhAwAQzH5Xs5WtzPOmTZuavtefTHQdy0T7L6sGtwaX9XWbNm1iZVnrwJwzZ840fbheJLboIKYauB85cqRpz0MPPWTGJ3G9O8xXTz75pKnv7qlv377OzGmlgWZ9rdMDVaJECdNuDaQHSzD2xccff2y+Rx1kffz48eYuOm90P3Xs2DFepW/0wr+vpfUAAAAAwFWYI9iFQpEq6Y+RZqJpzVU9mQYAAHHTO7zKli1rxlSpV69eqJuTZGkmvu4nHVj29ttvD3g5Oqio3hmoGe+UtQMAe3rHll681jujgvX3snnzoCwGAABj8WJJ9H6PTHQEhZ6QanmbwYMHh7opAAAkCzpIqpZBs8q2wDvNbte7++ITQFc6uKiOXaN3zNllvAMAAACAN2SiAwAAIFXQw95jx46ZevHeaq8DAMhEBwAkfYtDkInOwKIAAABIFcLCwkydewAAAADwB+VcAAAAAAAAAABISUH08PBwyZs3r/Ts2dPclgsAAICE0apVK+natWuomwEAAAAAIZMsy7kcPnxYvv/+e+nWrZs5qatVq1aomwQAAJAizZw505RBAQAAAIDUKllmohcuXFg6duxonh89ejTUzQEAAEixcuTIYQbaAQAAAIDUKlkG0VXatGnN/9HR0aFuCgAASCW0jNyrr74qkZGRkiFDBilVqpRMmDDB+f7KlStN1vbp06ed0xo1aiS9e/c2z1977TVp2LChlC5dWsqVKyfjxo0zAeoHHnggoGOaYsWKmXUmhCeeeMJsiz7iKudy6tQpOXLkSIK0AQAAAACSgmQbRFdp0qSR69evh7oZAAAglVi4cKGMGjVKJk+eLLt27ZKpU6dKlixZ/FqG3kW3aNEiiYmJkfnz58uaNWtk7dq1smnTpqC0ccSIEaZN3h5PP/20z8sZM2aMHDt2TJo1axbnfA899JC5qAAAAAAAKVWyrIluKVu2rCxZskTatWsn6dOnD3VzAABACnfgwAHJmTOnCSzrxXzNBPdXjRo1TBZ6tWrVzOcrVqwoZcqUkUOHDkmdOnXi3UYNlD/88MNe38uWLZvPy9F59cExFgAAAIDULllnon/wwQfy3XffSaZMmWT27Nmhbg4AAEjhWrdubUq6aDmWHj16yMcffyxRUVF+LUPLwFj/uz6/evWqT5+vUKGCM7NcA+/33Xef8/WqVaskV65cUrJkSa+PfPnySbBpORndJwAAAACQUiXrIPrAgQOlfPnysmHDBmnRokWomwMAAFK44sWLy759+0wtc83S7tOnj7Rs2dL5vtYP96RlW3zhayD666+/lu3bt5tHoUKF5P3333e+1iz3YJVzAQAAAACkgHIu69atM7VI9YQRAAAgMegdcM2bNzeP2rVrS/v27eXatWsmmzxHjhxmnsuXL0uePHnM88OHD0vlypWDtv6iRYs6n2tJmcKFC5ss82CXcwEAAAAApIAgut4+7e9gXgAAAIH66KOPzPFH3bp1JTw8XObOnSulSpVylmXR5xqo1gFDBwwYIJ988okpuZKYtJyLPuIjOjpaTp06ZZ7rIO5aaub48ePmdd68eSUiIsI5b9euXWXWrFmyf//+gGrEAwAAAEBSl2zLuejJnXI9iQMAAEhI2bNnl2nTppkBQDUL/dKlS7Jw4UK3LPVJkybJ2LFjTakVvWuufv36CTrQaaNGjYK+XM2eL1iwoHksXbpU5s2b53yt77nSrHvXLHwAAAAASGnCHMl0JKiffvpJGjZsaE5
O9UQWAAAAiUsPI/Pnzy9dunSRkSNHhro5AIAguHjxorlofOHChaCVAWvePCiLAQDAWLxYEr3fS5blXDJmzGhqjzZt2lRq1aoV6uYAAACkSjqYqZa3GTx4cKibAgAAAAAJJlkG0Xfu3Ck5c+Y0DwAAAIRGtWrV5Pz586FuBgAAAAAkqGQZRC9evHiomwAAAAAAAAAASAWS7cCiAAAAAAAAAAAkNILoAAAAfvriiy8kLCws1M0AAKQCEydOlGLFikmGDBmkdu3asnHjxjjnHzt2rJQpU8aMJRYZGSnPP/+8GVMMAAAELlUH0fVAZNSoUaFuBgAASGbuu+8+OXbsWKibAQBI4ebOnSv9+vWToUOHytatW6VKlSrStGlTOXnypNf558yZI4MGDTLz//777/LBBx+YZbz00kuJ3nYAAFKSVB1EBwAACET69OmlQIECoW4GACCFGzNmjPTo0UO6desm5cuXlylTpkimTJlk+vTpXudfu3at1K9fXx599FGTNHbvvfdKhw4dbpm9DgAAUmgQXW+h1gOHRx55RLJkySJ58uSRzz77zLwXHR0tw4YNM7eu6Xt33nmn/Pzzz87P6sGEfv7gwYMyYMAA81wfK1eudFv+ggULnK9fe+01qVixolsbrGmff/65lCpVytxepwcsSpely/jkk0/Me9myZZOnnnpKYmJi/NrOCRMmSIkSJcyyixYtKi+//LLzvQMHDph1bN682Tmta9eu8uCDD5rnM2fONJkKesvfbbfdZg648ubNa15fvHjRbT36+siRI3L9+nW/2gcAQGqyevVq53HDrcq56PvaV9vRPluPJeycO3fO9M16XAMASH2ioqJky5Yt0qRJE+e08PBw83rdunVeP1OvXj3zGSto/ueff8rXX38t999/v+169BxQzwddH0r7H+thncfq/96mu07zNj0i4p+HiMNMt167T3f4MV1iTQ8P/2d6WFiMT9P1dVzT9XO+TGeb2Ca2iW1im6ITfZuC1T9ZD1+kkWTsjTfekJ49e8rrr79uTjJdp2vwWoPIGnjWYLve8rZnzx7JmjWrbNq0yeygmjVryuOPPy7PPPOM+VyuXLn8bsOJEydk9OjRZh358+eX7777zu19bYPWTdVb6R5++GFp3ry5M8h9K3rw06dPH7OMRo0amW3UW/j8oRcKfvrpJ3n22WdN6Rp93rJlS3MgpRcgXDMc9MLDihUrzLoAAEBseiFay7gsXbrUZAUmJK1hO2vWLNm/f79JAAAApC6nT5825616nulKX+/atcvrZzQDXT/3n//8RxwOh9y8eVOefvrpOMu5vPnmm+Zc0NPOnTtNUpp1rlykSBFzTnr27FnnPHpXlj70ovGlS5ec0zWhLXfu3OYcXOux16ljLbO4nD+fTWrW/M0lgCKybVsZuX49ndSp86tbG9avryTp00dJtWq7ndOioyPM9Bw5LkmFCn86p1+9mkG2bi0r+fKdk5IlDzunnz+fVXbuLCGRkSclMvK4c/qJE7lk794iUqLEEcmf/99tOny4gBw6VEDKlTtg1mHZuzdSTpzILVWr7pGMGf+tMc82sU1sE9vENiX+Nv36/6uIb/+kLl++LL4Ic2jPmgxpdlfnzp3NyaUr3QG6AzU7XAPnlkKFCplAsWvgWE9Ie/fuLf379/e6/Pnz50u7du3Ma80U08z0HTt2OOfRaRrA1x2v2eKuNBO9cePGsmrVKnMAozQrvFWrVl4PULzRzPr27dubHwLNZPekPwi33367uShQo0YNZ1abHjQtWbLEBN81+3z9+vWmLp7O/+mnn5p9cMcdd8jAgQPdtoUgOgAAvtEL5K1btzYBCjt6LBFXAFz7bH3PLhtd3yeIDgCp119//SWFCxc2JVrq1q3rnK7ncT/++KNs2LAh1mf0PFTP94YPH24u/O7du1f69u1rSsK8+uqrtpnornckaya6Bhlcz0O1T9MseM3gc+37rOmeWXye09u2/Wd6dLTeDB/mFnT5d7pmNcb
4OD3i/7MX/52uzYqJiTBZiuHhjltOj4kJE4cj3Ha6Zj263nRmN51tYpvYJraJbUr8bfr/YiTx7p+sfk9jyRcuXPAaf00RmegNGjSINU0D2levXpU2bdq43Wat0/RWtmDT4LxnAN1VyZIlnc9z5szpdlXkVu6++26z7LJly8o999xjgvF6QKTZ9L7SMjDW/67PdX+40hP4uG4pBwAAt2Zl7FkqVKjgPB757bffZMSIEfLxxx+b1xqw0PesQc41S9A1U1AvhusDAJA6acnSiIgIc/ezK31tNy6HBso7deokTzzxhHldqVIluXLlijz55JOmNKgGDryN86EPT7pufbjy9nlr3rime94p/0/gJDb/pod5na4BH2935vs7XYM13thNZ5vYJraJbYprOtskQd0mz24n0P4prnlSVBA9R44ctu9pJrZePXcVSLkWi10t87jaoNKkcd/F/iT+67J//fVXU4JFMwo0yD1+/HhT0kWX660Wq68115PpDQgAACRp27dvdz7XMVG0fJpmEVoX3vUONusOuBdffNG8pyXX4nucAgBIedKlSyfVq1eXZcuWmTuarfM9fa13VHvz999/xwokWMEBzgEBAAhcsg6ie2MN8Kn1SrWcyq0OSrRGnF0A27UmzuHD/9bhSUzaRh04Rh8tWrQwt+Tt27dPypQp4wzge7Yzc+bMIWkrAACpnesdaErHZnEtxZIvXz7zUHpnmQbOPT8DAIClX79+0qVLF1O+s1atWjJ27FiTWW6Ny6ElTvWCrNY1VzoGl5YxrVatmrOci2an63RfM+0AAEBs3nPdkzENoA8YMEBeeOEFU9NcS7hoFrcOHupaz1zpSasOBHry5ElTS901i1uv+C9cuNDUyNFBW7788stE3xbNXhs3bpz8/PPPJnCudVGzZ89uCuYrfa7lXrRWu1q9erWplxcIvV1cM9u5bRwAAHtalu348eNy/vx581qf68PXwWj8oXegad+sxzEAgNRJx8jSsl9DhgyRqlWrmjuedHBra7DRQ4cOmQQyyyuvvGLOhfX/8uXLS/fu3c1YYVOnTg3hVgAAkPyluEx0NXToUEmbNq0ZcOXo0aNSsGBBueuuu5yZXxYdbEUHWNGgtNYldR1Uc/To0fLYY4+Zz+gVfK1FroO3JCatoa4DpOpJ9I0bN6Ry5cqyePFiyZgxo3MePRjSbdB2arZ6y5YtzS18/rJO/nVfAQAA73TMFdfjAavf1GMPz7FFbnXb/K0uXGvfrEF0K1ACAEidtHSLXfkWzwutWvZT+yR9AACA4AlzUBgNItKuXTuTxbBx48ZQNwUAAIiYW/dvv/12c2cdAACJ5eLFi+au5wsXLki2bNmCsszmzYOyGAAAjMWLJdH7vRSZiQ7/aBmb5cuXc5IOAEAScebMGfnll19k9uzZoW4KAAAAAKR6BNFhRm/XGq8AACBpyJ07t0RFRYW6GQAAAACAlDiwKAAAAAAAAAAAwUIQHQAAAAAAAAAAGwTRAQAAAAAAAAAIVhB92LBhkiFDBqlataqsX7/e348DAAAEPIZH3rx5pWfPnuJwOELdHAAAAABAKuF3EP2FF16Q7du3m0D666+/njCtAgAA8HD48GEZOXKkTJ48WTZt2hTq5gAAAAAAUgm/g+hZsmSRsmXLyt133y1Hjx5NmFYBAAB4KFy4sHTs2NE85xgEAAAAAJDka6KnTZtWoqOjg9saAACAWxx/KI5BAAAAAADJIoh+/fr14LYGAADgFtKkScMxCAAAAAAg6QfRtaTLgQMHZMuWLcFtEQAAwC2OQZYsWUIgHQAAAACQtIPobdq0kQ4dOkiNGjXMySwAAEBi+OCDD+S7776TTJkyyezZs0PdHAAAAABAChdwEH3lypXy8ccfy/vvvy9ff/11cFsFAABgY+DAgVK+fHnZsGGDtGjRItTNAQAAAACkcGkC/eD69eulSJEi0r179+C2CAAAIA7r1q2TqVOnmrvhAAAAAABIspnoWoc0S5YswW0
NAADALURFRXEMAgAAAABI+kH06OhoiYiICG5rAAAAbnH8oTgGAQAAAAAk6SC6ZoBt3rxZChYsGPwWAQAA2FizZo35n2MQAAAAAECSrYk+YsQIefXVV81t1J9++mnCtAoAAMBDxowZ5dq1a9K0aVOpVatWqJsDAAAAAEgl/A6iP/3009KpUyeTAZYmTcDjkgIAAPhl586dkjNnTvMAAAAAACCx+B0Fz5Url3kAAAAkpuLFi4e6CQAAAACAVCjggUUBAAAAAAAAAEjpCKIDAAAAAAAAAGCDIDoAAEhVihUrJqNGjQp1MwAAAAAAyQRBdAAAAAAAAAAAbBBEBwAAyUZYWJhMnz5dHnnkEcmSJYvkyZNHPvvsM/NedHS0DBs2TCIjI817d955p/z8889uGej6+YMHD8qAAQPMc32sXLnSbfkLFixwvn7ttdekYsWKbm2wpn3++edSqlQpyZAhg9SvX9+8p8vSZXzyySfmvWzZsslTTz0lMTExfm3nhAkTpESJEmbZRYsWlZdfftn53oEDB8w6Nm/e7JzWtWtXefDBB83zmTNnSpUqVaR27dpy2223yZQpUyRv3rzm9cWLF93Wo6+PHDki169f96t9AAAAAJCaEEQHAADJyhtvvCHVq1eXrVu3yrx58yRnzpzO6XPmzDFB5O3bt8t//vMfadq0qVy6dMm8v2nTJjl27JgJLA8ZMsQ810e9evX8bsOJEydk9OjRJqD/yy+/SIcOHdze1zZ88cUX5v1p06bJ119/7fOyt2zZIn369DFt3L17t9mmAgUK+NU+vVCg6y1ZsqQpXfPTTz/JuXPnYrVjzJgx5qLDunXr/Fo+AAAAAKQmaULdAAAAAH9ohrlmkqvSpUub/69duybvvPOOyQ6/++67zbQRI0aYYPZXX31lMtc1G1tFRERI1qxZ/Q5Muzpz5ozMmjXLZIu7tsPy6quvSoUKFcyjUqVKJoBvZYrfimaaaxtbt25tMtk1E93KdPdV2bJlpXLlylKnTh2zvHLlyskdd9whhw4d8ms5AAAAAAAy0QEAQDLToEGDWNP27NkjV69elTZt2phSLtZDM8b//PPPoLehUKFCzgC6N5oBbtFM+bNnz/q8bL0IoMvWQHiXLl1MRrmVTe8rLQNj/e/6XPeRZ2kah8MhjRo18mv5AAAAAJCakIkOAACSlRw5cti+t2TJElOexFWuXLkCXpddLfO42qDSpHE/xNJAta902b/++qspwaI11jXQPX78eFO+Rper9dB9bacnf9oBAAAAAPgHQXQAAJDsWQN8ao3zxo0bxzlvunTp5ObNm7YB7MuXLztfHz58WEJB29ikSRPzaNGihRkUdN++fVKmTBlnAN+znZkzZw5JWwEAAAAgpaOcCwAASPY0gK510l944QWZP3++KeGiWdzPPPOM7NixI1aple+++05Onjxpaqm7ZnHrgKULFy6U6Oho2bVrl3z55ZeJvi06+Oe4cePk559/NoFzrb2ePXt2KVKkiHlfn2u5lwULFpjXq1evlrVr1wa0Lq0Zr5nt+j8AAAAAwDuC6AAAIEUYOnSo9OzZUwYOHOisJ65B8nz58rnNN3z4cLlw4YIJSmfMmNGUTbGMHj1a9u/fbz7Tr18/MyBpYtMa6jpAqtYpr1Klimzbtk0WL15s2mqZOnWqCbZrOydNmiQtW7YMaF1WNnvBggWD1n4AAAAASGnCHBTHBAAASJXatWsnhw4dko0bN4a6KQCAJOLixYvmrie94JwtW7agLLN586AsBgAAY/FiSfR+j5roAAAAqZCWsVm+fLkpfwMAAAAAsEcQHQAAIBUKDw+Xs2fPhroZAAAAAJDkURMdAAAAAAAAAAAbBNEBAAAAAAAAALBBEB0AANzSsGHDJEOGDFK1alVZv359qJsDAAAAAECiIYgOAABu6YUXXpDt27ebQPrrr78e6uYAAAAAAJBoCKIDAIBbypIli5QtW1buvvtuOXr0aKibAwAAAABAoiGIDgAAfJY
2bVqJjo4OdTMAAAAAAEg0BNEBAIBfQfTr16+HuhkAAAAAACQagugAAMBnWtLlwIEDsmXLllA3BQAAAACAREEQHQAA+KxNmzbSoUMHqVGjhgmoAwAAAACQ0qUJdQMAAEDysXLlSvn444/l/fffl8aNG4e6OQAAAAAAJDiC6AAAwGfr16+XIkWKSPfu3UPdFAAAAAAAEgXlXAAAgM90UNEsWbKEuhkAAAAAACQagugAAMBn0dHREhEREepmAAAAAACQaAiiAwAAn0RFRcnmzZulYMGCoW4KAAAAAACJhiA6AAC4pREjRkjGjBll7dq10rdv31A3BwAAAACARMPAogAA4Jaefvpp6dSpk8lCT5OGwwcAAAAAQOrBWTAAALilXLlymQcAAAAAAKkN5VwAAAAAAAAAALBBEB0AAAAAAAAAABsE0QEAAAAAAAAAsEEQHQAAAAAAAAAAGwTRAQAAAAAAAACwQRAdAAAAAAAAAAAbBNEBAAAAAAAAALBBEB0AAAAAAAAAABsE0QEAAAAAAAAAsEEQHQAAAAAAAAAAGwTRAQAAAAAAAACwQRAdAAAAAAAAAAAbBNEBAAAAAAAAALBBEB0AAAAAAAAAABsE0QEAAAAACKKbN2/KDz/8IFOnTpVLly6ZaX/99Zdcvnw51E0DAAABSBPIhwAAAAAAQGwHDx6UZs2ayaFDh+T69etyzz33SNasWeXtt982r6dMmRLqJgIAAD+RiQ4AAAAAQJD07dtXatSoIefOnZOMGTM6p7du3VqWLVsW0rYBAIDAkIkOAAAAAECQrFq1StauXSvp0qVzm16sWDE5evRoyNoFAAACRyY6AAAAAABBEhMTI9HR0bGmHzlyxJR1AQAAyQ9BdAAAAAAAguTee++VsWPHOl+HhYWZAUWHDh0q999/f0jbBgAAAkMQHQAAAACAIBk1apSsWbNGypcvL9euXZNHH33UWcpFBxf118SJE83nM2TIILVr15aNGzfGOf/58+elV69eUrBgQUmfPr2ULl1avv7663hsEQAAoCY6AAAAAABBEhkZKT///LPMnTvX/K9Z6N27d5eOHTu6DTTqC11Gv379ZMqUKSaArhnuTZs2ld27d0u+fPlizR8VFSX33HOPeW/BggVSuHBhOXjwoOTIkSOIWwgAQOoT5nA4HKFuBAAAAAAAyd2NGzekbNmysmTJEilXrly8l6eB85o1a8qECROc9dY1SN+nTx8ZNGhQrPk12D5y5EjZtWuXpE2bNqB1Xrx4UbJnzy4XLlyQbNmySTA0bx6UxQAAYCxeLEHja79HORcAAAAAAIJAA9dawiUYNKt8y5Yt0qRJE+e08PBw83rdunVeP/Pll19K3bp1TTmX/PnzS8WKFWXEiBFeBzoFAAC+o5wLAAAAAABBogFsrX3+/vvvS5o0gZ9ynz592gS/NRjuSl9rprk3f/75pyxfvtyUjtE66Hv37pWePXuaDHkd2NSb69evm4drRp7SdVvBdx0cVQP4mgnvejO7Nd0zSO85PSLin+nR0ZrHFyYREe7z/zNd54vxcbou0OE2XZsVExMhYWExEh7uuOX0mJgwcTjCbaeHh0dLWJjccjrbxDaxTWwT25T422R1O/Htn/5ph28XmgmiAwAAAAAQJJs2bZJly5bJd999J5UqVZLMmTO7vb9w4cIEW7cGEbQe+nvvvScRERFSvXp1M6CplnixC6K/+eabMmzYsFjTd+7cKVmyZDHPc+XKJUWKFJEjR47I2bNnnfMUKFDAPA4cOCCXLl1yTteSM7lz55Y9e/aYzPw6daxlFpfz57NJzZq/uQVftm0rI9evp5M6dX51a8P69ZUkffooqVZtt1vQRafnyHFJKlT40zn96tUMsnVrWcmX75yULHnYOf38+ayyc2cJiYw8KZGRx53TT5zIJXv3FpESJY5I/vz/btPhwwXk0KECUq7cAbMOy969kXLiRG6pWnWPZMz4790GbBPbxDaxTWxT4m/Tr/+/ivj2T0r
HLvEFNdEBAAAAAAiSbt26xfn+jBkzfC7nkilTJjNAaKtWrZzTu3TpIufPn5dFixbF+kzDhg1NSZkffvjBOe2bb76R+++/32Sbp0uXzqdMdA0yaDDCqg0b30y/tm2TTvZiSszIZJvYJraJbUpt2/TZZ8HLRNd+T4Pxt6qJTiY6AAAAAABB4muQ/FY04K2Z5JrVbgXRNUigr3v37u31M/Xr15c5c+aY+TRIoP744w8pWLCg1wC6Sp8+vXl40kx2fbiylult3rime94p/0/gJDb/pod5na4BH2935vs7XYM13thNZ5vYJraJbYprOtskQd0mz24n0P4prnk8MbAoAAAAAABBdurUKVm9erV56PNA9OvXT6ZNmyazZs2S33//XZ555hm5cuWKM9u9c+fOMnjwYOf8+r5mkPft29cEz7/66iszsKjWaQcAAIEjEx0AAAAAgCDRIHefPn3kww8/NBnhVpabBrzHjx9vSrT4qn379iYAP2TIEDl+/LhUrVpVli5d6hxs9NChQ27Zd1qG5dtvv5Xnn39eKleuLIULFzYB9RdffDEBthQAgNSDmugAAAAAAATJU089ZWqST5gwwZRXUZqN/uyzz8o999wjkydPlqRMa8Nmz579lrVh/dG8eVAWAwCAsXixJHq/RyY6AAAAAABB8tlnn5nBQBs1auScpgN7ZsyYUR5++OEkH0QHAACxURMdAAAAAIAg+fvvv53lVlzly5fPvAcAAJIfgugAAAAAAARJ3bp1ZejQoXLt2jXntKtXr8qwYcPMewAAIPmhnAsAAAAAAEEybtw4adq0qdx2221SpUoVM+3nn3+WDBkymEE/AQBA8kMQHQAAAACAIKlYsaLs2bNHZs+eLbt27TLTOnToIB07djR10QEAQPJDEB0AAAAAgCDKlCmT9OjRI9TNAAAAQUJNdAAAAAAAguTNN9+U6dOnx5qu095+++2QtAkAAMQPQXQAAAAAAIJk6tSpUrZs2VjTK1SoIFOmTAlJmwAAQPwQRAcAAAAAIEiOHz8uBQsWjDU9b968cuzYsZC0CQAAxA9BdAAAAAAAgiQyMlLWrFkTa7pOK1SoUEjaBAAA4oeBRQEAAAAACBIdUPS5556TGzduyF133WWmLVu2TAYOHCgvvPBCqJsHAAACQBAdAAAAAIAgGTBggJw5c0Z69uwpUVFRZlqGDBnkxRdflMGDB4e6eQAAIABhDofDEepGAAAAAACQkly+fFl+//13yZgxo5QqVUrSp08vycHFixcle/bscuHCBcmWLVtQltm8eVAWAwCAsXixJHq/R010AAAAAACCLEuWLFKzZk3JmjWr7Nu3T2JiYkLdJAAAECCC6AAAAAAAxNP06dNlzJgxbtOefPJJKV68uFSqVEkqVqwohw8fDln7AABA4AiiAwAAAAAQT++9957kzJnT+Xrp0qUyY8YM+fDDD2XTpk2SI0cOGTZsWEjbCAAAAsPAogAAAAAAxNOePXukRo0azteLFi2Sli1bSseOHc3rESNGSLdu3ULYQgAAECgy0QEAAAAAiKerV6+6DUi2du1aufPOO52vtazL8ePHQ9Q6AAAQHwTRAQAAAACIp6JFi8qWLVvM89OnT8vOnTulfv36zvc1gJ49e/YQthAAAASKci4AAAAAAMRTly5dpFevXiZ4vnz5cilbtqxUr17dLTNdBxcFAADJD0F0AAAAAADiaeDAgfL333/LwoULpUCBAjJ//ny399esWSMdOnQIWfsAAEDgwhwOhyMenwcAAAAAACnExYsXTdmZCxcuuNV4j4/mzYOyGAAAjMWLJdH7PWqiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAECQrVqwIdRMAAECQEUQHAAAAACBImjVrJiVKlJDhw4fL4cOHQ90cAAAQBATRAQAAAAAIkqNHj0rv3r1lwYIFUrx4cWnatKnMmzdPoqKiQt00AAAQIILoAAA
AAAAESZ48eeT555+X7du3y4YNG6R06dLSs2dPKVSokDz77LPy888/h7qJAADATwTRAQAAAABIAHfccYcMHjzYZKZfvnxZpk+fLtWrV5cGDRrIzp07Q908AADgI4LoAAAAAAAE0Y0bN0w5l/vvv1+KFi0q3377rUyYMEFOnDghe/fuNdMeeuihUDcTAAD4KI2vMwIAAAAAgLj16dNHPvnkE3E4HNKpUyd55513pGLFis73M2fOLKNGjTLlXQAAQPJAEB0AAAAAgCD57bffZPz48dKmTRtJnz69bd30FStWJHrbAABAYCjnAgAAAABAkAwdOtSUavEMoN+8eVN++ukn8zxNmjTSsGHDELUQAAD4iyA6AAAAAABB0rhxYzl79mys6RcuXDDvAQCA5IcgOgAAAAAAQaK10MPCwmJNP3PmjKmHDgAAkh9qogMAAAAAEE9aA11pAL1r165u5Vyio6Pll19+kXr16oWwhQAAIFAE0QEAAAAAiKfs2bM7M9GzZs0qGTNmdL6XLl06qVOnjvTo0SOELQQAAIEiiA4AAAAAQDzNmDHD/F+sWDHp378/pVsAAEhBCKIDAAAAABAkQ4cODXUTAABAkBFEBwAAAAAgHu644w5ZtmyZ5MyZU6pVq+Z1YFHL1q1bE7VtAAAg/giiAwAAAAAQDy1btnQOJNqqVatQNwcAAAQZQXQAAAAAAIJQwiU6OloaN24slStXlhw5coS6WQAAIEjCg7UgAAAAAABSs4iICLn33nvl3LlzoW4KAAAIIoLoAAAAAAAEScWKFeXPP/8MdTMAAEAQEUQHAAAAACBIhg8fLv3795clS5bIsWPH5OLFi24PAACQ/FATHQAAAACAILn//vvN/y1atJCwsDDndIfDYV5r3XQAAJC8EEQHAAAAACBIVqxYEeomAACAICOIDgAAAABAkDRs2DDUTQAAAEFGEB0AAAAAgCD7+++/5dChQxIVFeU2vXLlyiFrEwAACAxBdAAAAAAAguTUqVPSrVs3+eabb7y+T010AACSn/BQNwAAAAAAgJTiueeek/Pnz8uGDRskY8aMsnTpUpk1a5aUKlVKvvzyy1A3DwAABIBMdAAAAAAAgmT58uWyaNEiqVGjhoSHh0vRokXlnnvukWzZssmbb74pDzzwQKibCAAA/EQmOgAAAAAAQXLlyhXJly+feZ4zZ05T3kVVqlRJtm7dGuLWAQCAQBBEBwAAAAAgSMqUKSO7d+82z6tUqSJTp06Vo0ePypQpU6RgwYKhbh4AAAgA5VwAAAAAAAiSvn37yrFjx8zzoUOHSrNmzWT27NmSLl06mTlzZqibBwAAAkAQHQAAAACAIHnsscecz6tXry4HDx6UXbt2SZEiRSRPnjwhbRsAAAgMQXQAAAAAABJIpkyZ5I477gh1MwAAQDwQRAcAAAAAIB769evn87xjxoxJ0LYAAIDgI4gOAAAAAEA8bNu2zaf5wsLCErwtAAAg+AiiAwAAAAAQDytWrAh1EwAAQAIKT8iFAwAAAAAAAACQnJGJDgAAAABAPLRp00Zmzpwp2bJlM8/jsnDhwkRrFwAACA6C6AAAAAAAxEP27Nmd9c71OQAASFkIogMAAAAAEA8zZszw+hwAAKQM1EQHAAAAAAAAAMAGmegAAAAAAATJmTNnZMiQIbJixQo5efKkxMTEuL1/9uzZkLUNAAAEhiA6AAAAAABB0qlTJ9m7d690795d8ufP76yVDgAAki+C6AAAAAAABMmqVatk9erVUqVKlVA3BQAABAk10QEAAAAACJKyZcvK1atXQ90MAAAQRATRAQAAAAAIkkmTJsnLL78sP/74o6mPfvHiRbcHAABIfijnAgAAAABAkOTIkcMEy++66y636Q6Hw9RHj46ODlnbAABAYAiiAwAAAAAQJB07dpS0adPKnDlzGFgUAIAUgiA6AAAAAABBsmPHDtm2bZuUKVMmKMubOHGijBw5Uo4fP24GKx0/frzUqlXrlp/79NNPpUO
HDtKyZUv54osvgtIWAABSK2qiAwAAAAAQJDVq1JDDhw8HZVlz586Vfv36ydChQ2Xr1q0miN60aVM5efJknJ87cOCA9O/fXxo0aBCUdgAAkNoRRAcAAAAAIEj69Okjffv2lZkzZ8qWLVvkl19+cXv4Y8yYMdKjRw/p1q2blC9fXqZMmSKZMmWS6dOn235Ga65rSZlhw4ZJ8eLFg7BFAACAci4AAAAAAARJ+/btzf+PP/64c5rWRfd3YNGoqCgThB88eLBzWnh4uDRp0kTWrVtn+7nXX39d8uXLJ927d5dVq1bFa1sAAMA/CKIDAAAAABAk+/fvD8pyTp8+bQLuOjipK329a9cur59ZvXq1fPDBB7J9+3af13P9+nXzsFy8eNH8r+u2Av4a/NcAfkxMjLkYYLGme14Y8JweEfHP9OhovRk+TCIi3Of/Z7rOF+PjdF2gw226NismJkLCwmIkPNxxy+kxMXphI9x2enh4tLiOCWs3nW1im9gmtoltSvxtsrqd+PZP/7TDt4vbBNEBAAAAAAiSokWLhmS9ly5dkk6dOsm0adMkT548Pn/uzTffNKVfPO3cuVOyZMlinufKlUuKFCkiR44ckbNnzzrnKVCggHloDXZdvyUyMlJy584te/bskWvXrkmdOtYyi8v589mkZs3f3IIv27aVkevX00mdOr+6tWH9+kqSPn2UVKu22y3ootNz5LgkFSr86Zx+9WoG2bq1rOTLd05Klvy3Jv3581ll584SEhl5UiIjjzunnziRS/buLSIlShyR/Pn/3abDhwvIoUMFpFy5A2Ydlr17I+XEidxSteoeyZjxmst+YpvYJraJbWKbEnubfv3/VcS3f1KXL18WX4Q5XMP0AAAAAADAL19++aXcd999kjZtWvM8Li1atPC5nIvWP1+wYIG0atXKOb1Lly5y/vx5WbRokdv8mn1erVo1ibDSvk0W4T/ZfZp1t3v3bilRooRPmegaZNBgRLZs2YKS6de2bdLJXkyJGZlsE9vENrFNqW2bPvsseJno2u9pMP7ChQvOfs8bgugAAAAAAMSDnpAfP37c1CLX53b8qYmuateuLbVq1ZLx48eb1xok0Iy73r17y6BBg9zm1Yy6vXv3uk175ZVXTAbeuHHjpHTp0pIuXbpbrlODCdmzZ79lMMEfzZsHZTEAABiLF0vQ+NrvUc4FAAAAAIB4sDK+PZ/HV79+/UzmeY0aNUwwfezYsXLlyhXp1q2beb9z585SuHBhU5IlQ4YMUrFiRbfP58iRw/zvOR0AAPiHIDoAAAAAAElQ+/bt5dSpUzJkyBCT6V61alVZunSpc7DRQ4cOxZn5DgAAgoNyLgAAAAAAxNO6devkzJkz8uCDDzqnffjhhzJ06FCTPa51zbUsS/r06SUpo5wLACCpWxyCci5csgYAAAAAIJ5ef/112blzp/P1r7/+Kt27d5cmTZqY+uWLFy82ZVcAAEDyQxAdAAAAAIB42r59u9x9993O159++qkZGHTatGmmtvm7774r8+bNC2kbAQBAYAiiAwAAAAAQT+fOnXPWKlc//vij3Hfffc7XNWvWlMOHD4eodQAAID4IogMAAAAAEE8aQN+/f795HhUVJVu3bpU6deo437906ZKkTZs2hC0EAACBIogOAAAAAEA83X///ab2+apVq2Tw4MGSKVMmadCggfP9X375RUqUKBHSNgIAgMCkCfBzAAAAAADg/73xxhvSpk0badiwoWTJkkVmzZol6dKlc74/ffp0uffee0PaRgAAEBiC6AAAAAAAxFOePHnkp59+kgsXLpggekREhNv78+fPN9MBAEDyQxAdAAAAAIAgyZ49u9fpuXLlSvS2AACA4KAmOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAA
AAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAAAAAANgiiAwAAAAAAAABggyA6AAAAAAAAAAA2CKIDAAAAAAAAAGCDIDoAAAAAAAAAADYIogMAAAAAAAAAYIMgOgAAAAAASdTEiROlWLFikiFDBqldu7Zs3LjRdt5p06ZJgwYNJGfOnObRpEmTOOcHAAC+IYgOAAAAAEASNHfuXOnXr58MHTpUtm7dKlWqVJGmTZvKyZMnvc6/cuVK6dChg6xYsULWrVsnkZGRcu+998rRo0cTve0AAKQkYQ6HwxHqRgAAAAAAAHeaeV6zZk2ZMGGCeR0TE2MC43369JFBgwbd8vPR0dEmI10/37lzZ5/WefHiRcmePbtcuHBBsmXLJsHQvHlQFgMAgLF4sQSNr/1emuCtEgAAAAAABENUVJRs2bJFBg8e7JwWHh5uSrRolrkv/v77b7lx44bkypXLdp7r16+bh2swwQrA60OFhYWZdWsQ3zUPz5puzWc3PSLin+nR0XozfJhERLjP/890nS/Gx+m6QIfbdG1WTEyEhIXFSHi445bTY2LCxOEIt50eHh4tYWFyy+lsE9vENrFNbFPib5PV7cS3f/qnHe7z2CGIDgAAAABAEnP69GlzYp8/f3636fp6165dPi3jxRdflEKFCpnAu50333xThg0bFmv6zp07JUuWLOa5BuGLFCkiR44ckbNnzzrnKVCggHkcOHBALl265Jyu2fK5c+eWPXv2yLVr16ROHWuZxeX8+WxSs+ZvbsGXbdvKyPXr6aROnV/d2rB+fSVJnz5KqlXb7RZ00ek5clySChX+dE6/ejWDbN1aVvLlOyclSx52Tj9/Pqvs3FlCIiNPSmTkcef0Eydyyd69RaREiSOSP/+/23T4cAE5dKiAlCt3wKzDsndvpJw4kVuqVt0jGTNec9lPbBPbxDaxTWxTYm/Tr/+/ivj2T+ry5cviC8q5AAAAAACQxPz1119SuHBhWbt2rdStW9c5feDAgfLjjz/Khg0b4vz8W2+9Je+8846pk165cmW/MtE1yKDBCOu29vhm+rVtm3SyF1NiRibbxDaxTWxTatumzz4LXia69nsajKecCwAAAAAAyUyePHkkIiJCTpw44TZdX2t2XVxGjRplgug//PBDnAF0lT59evPwpOvWhysNPHjjOZ/ndM875f8JnMTm3/Qwr9M14OPtznx/p2uwxhu76WwT28Q2sU1xTWebJKjb5NntBNo/xTWPJ+9rAAAAAAA
AIZMuXTqpXr26LFu2zDlNM+30tWtmuifNPn/jjTdk6dKlUqNGjURqLQAAKRuZ6AAAAAAAJEH9+vWTLl26mGB4rVq1ZOzYsXLlyhXp1q2beb9z586m5IvWNVdvv/22DBkyRObMmSPFihWT48f/qYWrtc2t+uYAAMB/BNEBAAAAAEiC2rdvL6dOnTKBcQ2IV61a1WSYW4ONHjp0yO0W9smTJ0tUVJS0a9fObTlDhw6V1157LdHbDwBASsHAogAAAAAAwDnAWvbs2W85wJo/mjcPymIAADAWL5ZE7/eoiQ4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAAAAAACADYLoAAAAAAAAAADYIIgOAAAAAAAAAIANgugAAAAAAAAAANggiA4AAAAAAAAAgA2C6AAAAAAAAAAA2CCIDgAAAABAEjVx4kQpVqyYZMiQQWrXri0bN26Mc/758+dL2bJlzfyVKlWSr7/+OtHaCgBASkUQHQAAAACAJGju3LnSr18/GTp0qGzdulWqVKkiTZs2lZMnT3qdf+3atdKhQwfp3r27bNu2TVq1amUeO3bsSPS2AwCQkoQ5HA5HqBsBAAAAAADcaeZ5zZo1ZcKECeZ1TEyMREZGSp8+fWTQoEGx5m/fvr1cuXJFlixZ4pxWp04dqVq1qkyZMsWndV68eFGyZ88uFy5ckGzZsgVlO5o3D8piAAAwFi+WoPG130sTvFUCAAAAAIBgiIqKki1btsjgwYOd08LDw6VJkyaybt06r5/R6Zq57koz17/44gvb9Vy/ft08LBpEUOfOnZPo6GjzPCwszKxbg/iueXjWdGs+u+kxMf9Mj47Wm+HDJCLCff5/potERMT4OD1CRBxu07VZMTEREhYWI+HhjltOj4kJE4cj3HZ6eHi0hIXJLaezTWwT28Q2sU2Jv03nzklQ+icriP7POuLOMyeIDgAAAABAEnP69Glzkp8/f3636fp6165dXj9z/Phxr/P
rdDtvvvmmDBs2LNZ0rcMOAEBSlCtX8Jd56dIlk5FuhyA6AAAAAACplGa6u2avazbf2bNnJXfu3CZjD0Di0GxYLdd0+PDhoJVSAnBrmoGuAfRChQrFOR9BdAAAAAAAkpg8efJIRESEnDhxwm26vi5QoIDXz+h0f+ZX6dOnNw9XOXLkiFfbAQROA+gE0YHEFVcGuuWfojQAAAAAACDJSJcunVSvXl2WLVvmliWur+vWrev1MzrddX71/fff284PAAB8QyY6AAAAAABJkJZZ6dKli9SoUUNq1aolY8eOlStXrki3bt3M+507d5bChQubuuaqb9++0rBhQxk9erQ88MAD8umnn8rmzZvlvffeC/GWAACQvBFEBwAAAAAgCWrfvr2cOnVKhgwZYgYHrVq1qixdutQ5eOihQ4ckPPzfG8zr1asnc+bMkVdeeUVeeuklKVWqlHzxxRdSsWLFEG4FAF9oWaWhQ4fGKq8EIGkIc2j1dAAAAAAAAAAAEAs10QEAAAAAAAAAsEEQHQAAAAAAAAAAGwTRAQAAAAAAAACwQRAdAAAAAAAAcPHaa6+ZwXwTWlhYmBkAOD66du0qrVq1cr5u1KiRPPfcc8lmHwDJAUF0AAAAAAAAJEvHjx+XPn36SPHixSV9+vQSGRkpzZs3l2XLloW6aXLq1Cl55plnpEiRIqZtBQoUkKZNm8qaNWuc8xw7dkzuu+++eK1n3LhxMnPmTAm2/v37u+1Hz2A9kJqkCXUDAAAAAAAAAH8dOHBA6tevLzly5JCRI0dKpUqV5MaNG/Ltt99Kr169ZNeuXSFtX9u2bSUqKkpmzZplgvwnTpwwQekzZ84459HAenxlz55dgsnhcEh0dLRkyZLFPACQiQ4AAAAAAIBkqGfPnqYcysaNG03AunTp0lKhQgXp16+frF+/3jnfoUOHpGXLliYgnC1bNnn44YdNQNvVW2+9Jfnz55esWbNK9+7d5dq1a7HW9/7770u5cuUkQ4YMUrZsWZk0aZJt286fPy+rVq2St99+Wxo3bixFixaVWrVqyeDBg6VFixZey7noRQF9PW/ePGnQoIFkzJhRatasKX/88Yds2rRJatSoYbZBM9c1y93XDPGPPvrIfFa3TYP2jz76qJw8edL5/sqVK816v/nmG6levbrJml+9erVbORd9rhcDFi1aZObVh37urrvukt69e7utT9uWLl26JHE3ABAsBNEBAAAAAACQrJw9e1aWLl1qMs4zZ84c633NTlcxMTEmgK7z//jjj/L999/Ln3/+Ke3bt3fOq0FrDRKPGDFCNm/eLAULFowVIJ89e7YMGTJE/vvf/8rvv/9u5n311VdNYNkbK4tbA+TXr1/3a9uGDh0qr7zyimzdulXSpEljgt4DBw40ZVs0ML93717TFl9pdv4bb7whP//8s2mPBus18O5p0KBB5mKCbl/lypVjlXbRiw/NmjUzJWj0Ua9ePXniiSdkzpw5btv48ccfS+HChU2AHUgpKOcCAAAAAACAZEUDyVp2RDPC46LZ0L/++qvs37/f1EtXH374oclY1+xuzfQeO3asyT7Xhxo+fLj88MMPbtnoGtgePXq0tGnTxry+/fbb5bfffpOpU6dKly5dYq1Xg99ap7xHjx4yZcoUueOOO6Rhw4byyCOPxApQe9KAtdZOV3379pUOHTqY7dDSNUrb6U8N9Mcff9z5XMvKvPvuu2a7L1++7Fau5fXXX5d77rnH6zJ0Ps2M12C5awka3R+aia4Z6hpkV9o2DdJrtjqQUpCJDgAAAAAAgGRFA+i+0KxqDZ5bAXRVvnx5k6mu71nz1K5d2+1zdevWdT6/cuWK7Nu3zwSvrQxzfWiwXafb0RIzf/31l3z55Zcmg1vLn2gw/VYBcNcgu5aYUVrv3XWaazmWW9myZYsZbFUHONWSLhrMt8rcuNKSL/7S0jadOnWS6dOnm9eaPb9jxw6vme5AckYmOgAAAAAAAJKVUqVKmUznxBg8VDO21bRp02I
F2yMiIm4ZZNbsbn1o+Rctf6JZ7XEFmdOmTet8bmVze07TMjW+0AsAmtWuDy1JkzdvXhM819c66Kkrb2VxfKHbpLXTjxw5IjNmzDBlXLQGPJCSkIkOAAAAAACAZCVXrlwmEDxx4kQTKPY2sKfSgUAPHz5sHhYtw6Lva0a6Nc+GDRvcPu86MKlmfhcqVMjUUi9ZsqTbQ8u6+EPX6a29CUUvMpw5c8bUOtfBSrX8jT9Z7K50sNDo6OhY0zVLXrPY9SKD1kd3LR8DpBQE0QEAAAAAAJDsaABdg7q1atWSzz77TPbs2WNKs2jNb6scS5MmTUyQt2PHjqbUyMaNG6Vz586mpIlVvkTrjms5Es2i/uOPP0ym+M6dO93WNWzYMHnzzTfNsnUerbOu848ZM8Zr2zRwrRnZOsjmL7/8Ymqyz58/X9555x0z0Gli0RIuGvweP368uQigpWV0kNFAFCtWzGzL7t275fTp02bAUtdsdA3Ua5md1q1bB3ELgKSBIDoAAAAAAACSHR0kUwPjjRs3lhdeeEEqVqxoyqboIJyTJ092lj7RQS9z5swpd955pwmq6+fmzp3rXE779u1NqZWBAwdK9erV5eDBg/LMM8+4rUuDxO+//74JnGtQXoPwWtvcLhNda6Zr6Zf//e9/Zr3aNl2HDjQ6YcIESSxavkXbqQF8zYLXQPeoUaMCWpa2vUyZMubigy53zZo1zvd08FMdTFX/1xI2QEoT5vB1JAYAAAAAAAAA8HDgwAEpUaKEbNq0yQyeCqQ0BNEBAAAAAAAA+E1Lumjpmv79+5uSNa7Z6UBKQjkXAAAAAAAAAH7ToHnBggVNBvqUKVNC3RwgwZCJDgAAAAAAAACADTLRAQAAAAAAAACwQRAdAAAAAAAAAAAbBNEBAAAAAAAAALBBEB0AAAAAAAAAABsE0QEAAAAAAAAAsEEQHQAAAAAAAAAAGwTRAQAAAAAAAACwQRAdAAAAAAAAAAAbBNEBAAAAAAAAABDv/g/+bbfxgURjrAAAAABJRU5ErkJggg==", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import matplotlib.pyplot as plt\n", + "\n", + "# Paths to the two code files\n", + "file_1_path = \"test_codes/input_code_3.c\" # Update with your actual file path\n", + "file_2_path = \"test_codes/input_code_4.c\" # Update with your actual file path\n", + "\n", + "# Read the content of both files\n", + "with open(file_1_path, \"r\") as f1:\n", + " code_snippet_1 = f1.read()\n", + "\n", + "with open(file_2_path, \"r\") as f2:\n", + " code_snippet_2 = f2.read()\n", + "\n", + "# Create figure with 1 row, 3 columns (Two code snippets + Similarity bar)\n", + "fig, axes = plt.subplots(1, 3, figsize=(15, 5))\n", + "\n", + "# Display Code Snippet 1\n", + "axes[0].text(0, 1, code_snippet_1, fontsize=10, family='monospace', verticalalignment='top')\n", + "axes[0].axis(\"off\") # Hide axes\n", + "axes[0].set_title(\"Code Snippet 1\")\n", + "\n", + "# Display Code Snippet 2\n", + "axes[1].text(0, 1, code_snippet_2, fontsize=10, family='monospace', verticalalignment='top')\n", + "axes[1].axis(\"off\") # Hide axes\n", + "axes[1].set_title(\"Code Snippet 2\")\n", + "\n", + "# Plot Similarity Score\n", + "axes[2].bar([\"Code Similarity\"], [similarity], color='blue', alpha=0.7)\n", + "axes[2].set_ylim(0, 1)\n", + "axes[2].set_ylabel(\"Similarity Score\")\n", + "axes[2].set_title(\"Code Similarity\")\n", + "axes[2].grid(axis=\"y\", linestyle=\"--\", alpha=0.6)\n", + "\n", + "# Adjust layout to fit text properly\n", + "plt.tight_layout()\n", + "plt.show()\n" + ] + }, + { + "cell_type": "code", + "execution_count": 25, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "0.7181637\n" + ] + } + ], + "source": [ + "cass_strs_5 = drive_tree(input_file='test_codes/input_code_5.c')\n", + "cass_strs_6 = drive_tree(input_file='test_codes/input_code_6.c')\n", + "casses_5, _ = cass_manager.load_casses_from_strs(cass_strs_5)\n", + "casses_6, _ = 
cass_manager.load_casses_from_strs(cass_strs_6)\n", + "input_5 = gnn_preprocessor.preprocess_casses_combined(casses_5)\n", + "input_6 = gnn_preprocessor.preprocess_casses_combined(casses_6)\n", + "vectors = gnn_runner.compute_code_vector_batched([input_5, input_6])\n", + "from numpy.linalg import norm\n", + "similarity = (vectors[0] @ vectors[1].T) / (norm(vectors[0]) * norm(vectors[1]))\n", + "print(similarity)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import matplotlib.pyplot as plt\n", + "\n", + "# Paths to the two code files\n", + "file_1_path = \"test_codes/input_code_5.c\" # Update with your actual file path\n", + "file_2_path = \"test_codes/input_code_6.c\" # Update with your actual file path\n", + "\n", + "# Read the content of both files\n", + "with open(file_1_path, \"r\") as f1:\n", + " code_snippet_1 = f1.read()\n", + "\n", + "with open(file_2_path, \"r\") as f2:\n", + " code_snippet_2 = f2.read()\n", + "\n", + "# Create figure with 1 row, 3 columns (Two code snippets + Similarity bar)\n", + "fig, axes = plt.subplots(1, 3, figsize=(15, 5))\n", + "\n", + "# Display Code Snippet 1\n", + "axes[0].text(0, 1, code_snippet_1, fontsize=10, family='monospace', verticalalignment='top')\n", + "axes[0].axis(\"off\") # Hide axes\n", + "axes[0].set_title(\"Code Snippet 1\")\n", + "\n", + "# Display Code Snippet 2\n", + "axes[1].text(0, 1, code_snippet_2, fontsize=10, family='monospace', verticalalignment='top')\n", + "axes[1].axis(\"off\") # Hide axes\n", + "axes[1].set_title(\"Code Snippet 2\")\n", + "\n", + "# Plot Similarity Score\n", + "axes[2].bar([\"Code Similarity\"], [similarity], color='blue', alpha=0.7)\n", + "axes[2].set_ylim(0, 1)\n", + "axes[2].set_ylabel(\"Similarity Score\")\n", + "axes[2].set_title(\"Code Similarity\")\n", + "axes[2].grid(axis=\"y\", linestyle=\"--\", alpha=0.6)\n", + "\n", + "# Adjust layout to fit text properly\n", + "plt.tight_layout()\n", + "plt.show()" + ] + }, + { + "cell_type": "code", + "execution_count": 37, + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "0.6534402\n" + ] + } + ], + "source": [ + "cass_strs_7 = drive_tree(input_file='test_codes/input_code_7.c')\n", + "cass_strs_8 = drive_tree(input_file='test_codes/input_code_8.c')\n", + "casses_7, _ = cass_manager.load_casses_from_strs(cass_strs_7)\n", + "casses_8, _ = 
cass_manager.load_casses_from_strs(cass_strs_8)\n", + "input_7 = gnn_preprocessor.preprocess_casses_combined(casses_7)\n", + "input_8 = gnn_preprocessor.preprocess_casses_combined(casses_8)\n", + "vectors = gnn_runner.compute_code_vector_batched([input_7, input_8])\n", + "from numpy.linalg import norm\n", + "similarity = (vectors[0] @ vectors[1].T) / (norm(vectors[0]) * norm(vectors[1]))\n", + "print(similarity)\n" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import matplotlib.pyplot as plt\n", + "\n", + "# Paths to the two code files\n", + "file_1_path = \"test_codes/input_code_7.c\" # Update with your actual file path\n", + "file_2_path = \"test_codes/input_code_8.c\" # Update with your actual file path\n", + "\n", + "# Read the content of both files\n", + "with open(file_1_path, \"r\") as f1:\n", + " code_snippet_1 = f1.read()\n", + "\n", + "with open(file_2_path, \"r\") as f2:\n", + " code_snippet_2 = f2.read()\n", + "\n", + "# Create figure with 1 row, 3 columns (Two code snippets + Similarity bar)\n", + "fig, axes = plt.subplots(1, 3, figsize=(15, 5))\n", + "\n", + "# Display Code Snippet 1\n", + "axes[0].text(0, 1, code_snippet_1, fontsize=10, family='monospace', verticalalignment='top')\n", + "axes[0].axis(\"off\") # Hide axes\n", + "axes[0].set_title(\"Code Snippet 1\")\n", + "\n", + "# Display Code Snippet 2\n", + "axes[1].text(0, 1, code_snippet_2, fontsize=10, family='monospace', verticalalignment='top')\n", + "axes[1].axis(\"off\") # Hide axes\n", + "axes[1].set_title(\"Code Snippet 2\")\n", + "\n", + "# Plot Similarity Score\n", + "axes[2].bar([\"Code Similarity\"], [similarity], color='blue', alpha=0.7)\n", + "axes[2].set_ylim(0, 1)\n", + "axes[2].set_ylabel(\"Similarity Score\")\n", + "axes[2].set_title(\"Code Similarity\")\n", + "axes[2].grid(axis=\"y\", linestyle=\"--\", alpha=0.6)\n", + "\n", + "# Adjust layout to fit text properly\n", + "plt.tight_layout()\n", + "plt.show()" + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "MyPythonEnv", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.10" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git 
a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/cass/cass.py b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/cass/cass.py new file mode 100755 index 00000000000..336b65596f4 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/cass/cass.py @@ -0,0 +1,357 @@ +'''MIT License + +Copyright (c) 2021 Intel Labs + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. 
+''' +from enum import Enum + +from .config import cass_config as config + + +class NodeType(Enum): + Internal = 0, + NumLit = 1, + CharLit = 2, + StringLit = 3, + GlobalVar = 4, + GlobalFun = 5, + LocalVar = 6, + LocalFun = 7, + FunSig = 8, + Error = 9 + + +class CassNode: + def __init__(self, node_type, label='', children=[]): + self.node_type = node_type + self.children = children + self.prev_use = None + self.next_use = None + self.parent = None + self.child_id = 0 + + self.removed = False + + if len(label) == 0: + self.label = label + self.n = label + + elif node_type == NodeType.FunSig: + if config.fsig_mode == 0: + self.n = None + else: + self.n = label + + elif node_type == NodeType.Internal: + assert label[0] == '#' + p = label[1:].find('#') + assert p > 0 + p += 2 + self.annot = label[:p] + self.label = label[p:] + + if self.annot == '#compound_statement#': + if config.compound_mode == 0: + pass + elif config.compound_mode == 1: + self.removed = True + elif config.compound_mode == 2: + self.label = '{#}' + else: + raise Exception() + + if config.annot_mode == 0: + self.n = self.label + elif config.annot_mode == 1: + self.n = self.annot + self.label + elif config.annot_mode == 2: + if self.annot == '#parenthesized_expression#' or self.annot == '#argument_list#': + self.n = self.annot + self.label + else: + self.n = self.label + else: + raise Exception() + + else: + if node_type == NodeType.LocalVar or node_type == NodeType.LocalFun: + self.n = '$VAR' + + elif node_type == NodeType.GlobalVar: + if config.gvar_mode == 0: + self.n = label + elif config.gvar_mode == 1: + self.n = label + self.removed = True + elif config.gvar_mode == 2: + self.n = '$GVAR' + elif config.gvar_mode == 3: + self.n = '$VAR' + else: + raise Exception() + + elif node_type == NodeType.GlobalFun: + if config.gfun_mode == 0: + self.n = label + elif config.gfun_mode == 1: + self.n = label + self.removed = True + elif config.gfun_mode == 2: + self.n = '$GFUN' + elif config.gfun_mode == 3: 
+ if config.gvar_mode == 3: + self.n = '$VAR' + else: + self.n = '$GVAR' + else: + raise Exception() + + else: + self.n = label + + self.features = [] + + +class CassTree: + def __init__(self, nodes, leaf_nodes): + self.nodes = nodes + self.leaf_nodes = leaf_nodes + if nodes[0].node_type == NodeType.FunSig: + self.fun_sig_node = nodes[0] + self.root = nodes[1] + else: + self.fun_sig_node = None + self.root = nodes[0] + self.leaf_ranges = self._compute_leaf_ranges() + + def _compute_leaf_ranges(self): + node2leaf_id = {} + leaf_ranges = {} + for i, node in enumerate(self.leaf_nodes): + node2leaf_id[node] = i + + def compute_leaf_ranges_rec(node): + if len(node.children) == 0: + x = node2leaf_id[node] + leaf_ranges[node] = (x, x + 1) + else: + for c in node.children: + compute_leaf_ranges_rec(c) + leaf_ranges[node] = ( + leaf_ranges[node.children[0]][0], leaf_ranges[node.children[-1]][1]) + + compute_leaf_ranges_rec(self.root) + return leaf_ranges + + def _get_context(self, node): + assert not node.removed + + p = node.parent + if p is None: + return None + if p.label != '$.$': + if p.removed: + return None + return (node.child_id, p.n) + else: + for i in range(*(self.leaf_ranges[p])): + l = self.leaf_nodes[i] + if l.node_type == NodeType.GlobalVar or l.node_type == NodeType.GlobalFun: + if l.removed: + return None + return l.n + return None + + def featurize(self): + for i, node in enumerate(self.leaf_nodes): + if node.removed: + continue + + node.features.append(node.n) + + p = node + for _ in range(3): + cid = p.child_id + p = p.parent + if p is None: + break + if p.removed: + continue + node.features.append((node.n, cid, p.n)) + + if i > 0: + sib = self.leaf_nodes[i - 1] + if not sib.removed: + node.features.append((sib.n, node.n)) + if i < len(self.leaf_nodes) - 1: + sib = self.leaf_nodes[i + 1] + if not sib.removed: + node.features.append((node.n, sib.n)) + + if node.prev_use is not None: + if not node.prev_use.removed: + prev_ctx = 
self._get_context(node.prev_use) + ctx = self._get_context(node) + if prev_ctx is not None and ctx is not None: + node.features.append((prev_ctx, ctx)) + if node.next_use is not None: + if not node.next_use.removed: + ctx = self._get_context(node) + next_ctx = self._get_context(node.next_use) + if ctx is not None and next_ctx is not None: + node.features.append((ctx, next_ctx)) + + features = [] + for n in self.leaf_nodes: + features += n.features + + if config.fsig_mode == 1 and self.fun_sig_node is not None: + features.append(self.fun_sig_node.n) + + return features + + +def load_file(file_name): + casses = [] + with open(file_name) as f: + for line in f: + cass, _ = deserialize(line) + if cass is not None: + casses.append(cass) + return casses + + +def deserialize(s): + tokens = s.strip().split('\t') + src_range = tuple(map(int, tokens[0].split(','))) + assert len(src_range) == 4 + cass = deserialize_from_tokens(tokens[1:]) + return cass, src_range + + +def deserialize_from_tokens(tokens): + num_tokens = len(tokens) + if num_tokens == 0: + return None + + num_nodes = int(tokens[0]) + + nodes = [] + leaf_nodes = [] + + i = 1 + + has_fun_sig = False + if tokens[i][0] == 'S': + has_fun_sig = True + fun_sig = tokens[i] + i += 1 + fun_sig = fun_sig[1:] + nodes.append(CassNode(NodeType.FunSig, fun_sig)) + + while i < num_tokens: + node_type_label = tokens[i] + i += 1 + node_type_str = node_type_label[0] + label = node_type_label[1:] + if node_type_str == 'I': + num_child = int(tokens[i]) + i += 1 + nodes.append( + CassNode(NodeType.Internal, label, [None] * num_child)) + elif node_type_str == 'N': + node = CassNode(NodeType.NumLit, label) + nodes.append(node) + leaf_nodes.append(node) + elif node_type_str == 'C': + node = CassNode(NodeType.CharLit, label) + nodes.append(node) + leaf_nodes.append(node) + elif node_type_str == 'S': + node = CassNode(NodeType.StringLit, label) + nodes.append(node) + leaf_nodes.append(node) + elif node_type_str == 'V': + node = 
CassNode(NodeType.GlobalVar, label) + nodes.append(node) + leaf_nodes.append(node) + elif node_type_str == 'F': + node = CassNode(NodeType.GlobalFun, label) + nodes.append(node) + leaf_nodes.append(node) + elif node_type_str == 'v': + prev_use = int(tokens[i]) + next_use = int(tokens[i + 1]) + i += 2 + node = CassNode(NodeType.LocalVar, label) + node.prev_use = prev_use + node.next_use = next_use + nodes.append(node) + leaf_nodes.append(node) + elif node_type_str == 'f': + prev_use = int(tokens[i]) + next_use = int(tokens[i + 1]) + i += 2 + node = CassNode(NodeType.LocalFun, label) + node.prev_use = prev_use + node.next_use = next_use + nodes.append(node) + leaf_nodes.append(node) + elif node_type_str == 'E': + node = CassNode(NodeType.Error) + nodes.append(node) + leaf_nodes.append(node) + else: + raise Exception() + + assert num_nodes == len(nodes) + + for n in nodes: + if n.node_type == NodeType.LocalVar or n.node_type == NodeType.LocalFun: + if n.prev_use >= 0: + n.prev_use = nodes[n.prev_use] + else: + n.prev_use = None + if n.next_use >= 0: + n.next_use = nodes[n.next_use] + else: + n.next_use = None + + if has_fun_sig: + tree_start = 1 + else: + tree_start = 0 + + root, rem_nodes = build_tree_rec(nodes[tree_start:]) + + assert root == nodes[tree_start] + assert len(rem_nodes) == 0 + + return CassTree(nodes, leaf_nodes) + + +def build_tree_rec(nodes): + node = nodes[0] + nodes = nodes[1:] + for i in range(len(node.children)): + child, nodes = build_tree_rec(nodes) + child.parent = node + child.child_id = i + node.children[i] = child + return node, nodes \ No newline at end of file diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/cass/config.py b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/cass/config.py new file mode 100755 index 00000000000..e33b92f3a57 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/cass/config.py @@ -0,0 
+1,31 @@ +''' +MIT License + +Copyright (c) 2021 Intel Labs + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. 
+''' +from types import SimpleNamespace +cass_config = SimpleNamespace( +annot_mode=2, +compound_mode=2, +gvar_mode=3, +gfun_mode=1, +fsig_mode=1 +) diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/datasets/poj/dataset-gnn/vocab.pkl b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/datasets/poj/dataset-gnn/vocab.pkl new file mode 100644 index 00000000000..840cf07b2cd Binary files /dev/null and b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/datasets/poj/dataset-gnn/vocab.pkl differ diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/datasets/split_gcj.pkl b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/datasets/split_gcj.pkl new file mode 100644 index 00000000000..8846e8cee0b Binary files /dev/null and b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/datasets/split_gcj.pkl differ diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/datasets/split_poj.pkl b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/datasets/split_poj.pkl new file mode 100644 index 00000000000..349d8ae33e9 Binary files /dev/null and b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/datasets/split_poj.pkl differ diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/models/poj/gnn/model.pt b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/models/poj/gnn/model.pt new file mode 100644 index 00000000000..557cdfec95e Binary files /dev/null and b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/data/models/poj/gnn/model.pt differ diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism 
Detection/MICSAS/interface/README.md b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/README.md new file mode 100755 index 00000000000..f8d8041c1bd --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/README.md @@ -0,0 +1,37 @@ +# MISIM Interface + +## Setup + +Use this [Makefile](../Makefile). + +Vocabularies are available [here](https://www.dropbox.com/s/zilq32a4s9pygde/datasets.tar.xz). +Pre-trained models are available [here](https://www.dropbox.com/s/jlfp2oypzkc29q7/models.tar.xz). +Extract them into `../data/`. + +## Usage example: +```python +import misim.interface as misim + +cass_manager = misim.CASSManager() +gnn_preprocessor = misim.GNNPreprocessor('misim/data/datasets/poj/dataset-gnn/vocab.pkl') +gnn_runner = misim.GNNRunner('misim/data/datasets/poj/dataset-gnn/vocab.pkl', 'misim/data/models/poj/gnn/0/model.pt') + +# Compute GNN feature vectors for each function/loop in a source file. +cass_strs = cass_manager.extract_cass_strs_from_src_file('test.c', extract_loops=True) +casses, src_ranges = cass_manager.load_casses_from_strs(cass_strs) +inputs = gnn_preprocessor.preprocess_casses_seperated(casses) +vectors = gnn_runner.compute_code_vector_batched(inputs) +for i in range(len(src_ranges)): + print(src_ranges[i], vectors[i]) + +# Compute code similarity between two source files. 
+cass_strs_1 = cass_manager.extract_cass_strs_from_src_file('test1.c', extract_loops=False) +cass_strs_2 = cass_manager.extract_cass_strs_from_src_file('test2.c', extract_loops=False) +casses_1, _ = cass_manager.load_casses_from_strs(cass_strs_1) +casses_2, _ = cass_manager.load_casses_from_strs(cass_strs_2) +input_1 = gnn_preprocessor.preprocess_casses_combined(casses_1) +input_2 = gnn_preprocessor.preprocess_casses_combined(casses_2) +vectors = gnn_runner.compute_code_vector_batched([input_1, input_2]) +from numpy.linalg import norm +similarity = (vectors[0] @ vectors[1].T) / (norm(vectors[0]) * norm(vectors[1])) +``` diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/__init__.py b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/__init__.py new file mode 100755 index 00000000000..370caea5d6a --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/__init__.py @@ -0,0 +1,26 @@ +''' +MIT License + +Copyright (c) 2021 Intel Labs + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. +''' +from .cass_manager import CASS, CASSManager, SourceRange +from .model_preprocessor import ModelPreprocessor, GNNPreprocessor +from .model_runner import ModelRunner, GNNRunner diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/cass_manager.py b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/cass_manager.py new file mode 100755 index 00000000000..ea9913dcb09 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/cass_manager.py @@ -0,0 +1,81 @@ +''' +MIT License + +Copyright (c) 2021 Intel Labs + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. 
+''' +from pathlib import Path +import subprocess +from collections import namedtuple +from typing import Tuple, Union, List + +from ..cass import cass + + +CASS = cass.CassTree +SourceRange = namedtuple('SourceRange', ['start_line', 'start_column', 'end_line', 'end_column']) + + +class CASSManager: + def __init__(self, use_c_parser: bool = False) -> None: + cass_extractor: str = str( + Path(__file__).parent.parent / + 'cass-extractor' / 'build' / 'bin' / 'cass-extractor' + ) + self.extract_command = [cass_extractor] + if use_c_parser: + self.extract_command.append('-c') + + def extract_cass_strs_from_src_file(self, file_name: str, extract_loops: bool) -> List[str]: + """ + Extract CASSes from the given source file. Return a list of serialized CASS strings. + If extract_loops is True, each function and loop will be extracted as a CASS, otherwise only functions will be extracted. + """ + cmd = self.extract_command + ['-l'] if extract_loops \ + else self.extract_command + output = subprocess.check_output( + cmd + ['-f', file_name], encoding='utf-8') + return output.splitlines() + + def extract_cass_strs_from_src_text(self, src_text: Union[str, bytes], extract_loops: bool) -> List[str]: + """ + Extract CASSes from the given source text. Return a list of serialized CASS strings. + If extract_loops is True, each function and loop will be extracted as a CASS, otherwise only functions will be extracted. 
+ """ + cmd = self.extract_command + ['-l'] if extract_loops \ + else self.extract_command + output = subprocess.check_output(cmd, input=src_text, encoding='utf-8') + return output.splitlines() + + @staticmethod + def load_cass_from_str(cass_str: str) -> Tuple[CASS, SourceRange]: + c, src_range = cass.deserialize(cass_str) + assert c + return c, SourceRange(*src_range) + + @staticmethod + def load_casses_from_strs(cass_strs: List[str]) -> Tuple[List[CASS], List[SourceRange]]: + casses = [] + src_ranges = [] + for cass_str in cass_strs: + c, rng = CASSManager.load_cass_from_str(cass_str) + casses.append(c) + src_ranges.append(rng) + return casses, src_ranges diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/model_preprocessor.py b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/model_preprocessor.py new file mode 100755 index 00000000000..d29cb2052ff --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/model_preprocessor.py @@ -0,0 +1,101 @@ +''' +MIT License + +Copyright (c) 2021 Intel Labs + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. +''' +import pickle +import numpy as np +from typing import List, Tuple, Dict, Union, cast, Generic, TypeVar +from abc import ABC, abstractmethod + +from ..cass import cass +from .cass_manager import CASS + + +T = TypeVar('T') + + +class ModelPreprocessor(ABC, Generic[T]): + @abstractmethod + def preprocess_cass(self, cass: CASS) -> T: + pass + + @abstractmethod + def preprocess_casses_combined(self, casses: List[CASS]) -> T: + """ + Convert multiple CASSes into one instace of model input. + """ + pass + + @abstractmethod + def preprocess_casses_seperated(self, casses: List[CASS]) -> List[T]: + """ + Convert each CASS into one instace of model input. + """ + pass + + +class GNNPreprocessor(ModelPreprocessor[Tuple[np.ndarray, np.ndarray]]): + def __init__(self, vocab: Union[str, Dict[str, int]]) -> None: + if isinstance(vocab, str): + with open(vocab, 'rb') as f: + self.vocab: Dict[str, int] = pickle.load(f) + else: + self.vocab = vocab + + def preprocess_cass(self, cass: CASS) -> Tuple[np.ndarray, np.ndarray]: + """ + Build a graph from one CASS. + """ + nodes = [] + edges = [] + build_graph(cass.root, nodes, edges) + if cass.fun_sig_node is not None and cass.fun_sig_node.n is not None: + nodes.append(cass.fun_sig_node.n) + return np.array([self.vocab.get(t, 0) for t in nodes]), np.array(edges).T + + def preprocess_casses_combined(self, casses: List[CASS]) -> Tuple[np.ndarray, np.ndarray]: + """ + Build a graph from a list of CASSes. 
+ """ + nodes = [] + edges = [] + for cass in casses: + build_graph(cass.root, nodes, edges) + if cass.fun_sig_node is not None and cass.fun_sig_node.n is not None: + nodes.append(cass.fun_sig_node.n) + return np.array([self.vocab.get(t, 0) for t in nodes]), np.array(edges).T + + def preprocess_casses_seperated(self, casses: List[CASS]) -> List[Tuple[np.ndarray, np.ndarray]]: + """ + Build a list of graphs from a list of CASSes. + """ + return [self.preprocess_cass(c) for c in casses] + + +def build_graph(node: cass.CassNode, nodes: List[str], edges: List[Tuple[int, int]]): + node_id = len(nodes) + nodes.append(cast(str, node.n)) + last_id = node_id + for c in node.children: + edges.append((node_id, last_id + 1)) + last_id = build_graph(c, nodes, edges) + return last_id diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/model_runner.py b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/model_runner.py new file mode 100755 index 00000000000..6356425ee09 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/interface/model_runner.py @@ -0,0 +1,90 @@ +''' +MIT License + +Copyright (c) 2021 Intel Labs + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. 
+ +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. +''' +import pickle +import numpy as np +from abc import ABC, abstractmethod +from typing import Iterable, Tuple, Dict, Generic, TypeVar, Union +import torch + +from ..models.gnn_model import GNNModel + + +T = TypeVar('T') + + +class ModelRunner(ABC, Generic[T]): + @abstractmethod + def compute_code_vector(self, preprocessed_cass: T) -> np.ndarray: + """ + Compute a code vector for preprocessed CASS. + Return a 1D array with shape (vector_size,). + """ + pass + + @abstractmethod + def compute_code_vector_batched(self, preprocessed_cass_batch: Iterable[T]) -> np.ndarray: + """ + Compute code vectors for a batch of preprocessed CASS. + Return a 2D array with shape (batch_size, vector_size). 
+ """ + pass + + +class GNNRunner(ModelRunner[Tuple[np.ndarray, np.ndarray]]): + def __init__(self, vocab: Union[str, Dict[str, int]], model_path: str, output_size: int = 128, + node_emb_size: int = 128, num_layers: int = 3, device: str = 'cpu') -> None: + if isinstance(vocab, str): + with open(vocab, 'rb') as f: + self.vocab: Dict[str, int] = pickle.load(f) + else: + self.vocab = vocab + self.device = torch.device(device) + self.model = GNNModel(node_emb_size, len(self.vocab), + output_size, num_layers) + self.model.load_state_dict(torch.load( + model_path, map_location=self.device)) + + def compute_code_vector(self, preprocessed_cass: Tuple[np.ndarray, np.ndarray]) -> np.ndarray: + return np.squeeze(self.compute_code_vector_batched([preprocessed_cass]), axis=0) + + def compute_code_vector_batched(self, preprocessed_cass_batch: Iterable[Tuple[np.ndarray, np.ndarray]]) -> np.ndarray: + num_prev_nodes = 0 + nodes_batch = [] + edges_batch = [] + indices_batch = [] + for i, (nodes, edges) in enumerate(preprocessed_cass_batch): + num_nodes = nodes.shape[0] + nodes_batch.append(torch.from_numpy(nodes)) + edges_batch.append(torch.from_numpy(edges) + num_prev_nodes) + num_prev_nodes += num_nodes + indices_batch.append(torch.full((num_nodes,), i, dtype=torch.long)) + + batched_nodes = torch.cat(nodes_batch).to(self.device) + batched_edges = torch.cat(edges_batch, dim=1).to(self.device) + batched_indices = torch.cat(indices_batch).to(self.device) + + with torch.no_grad(): + v: torch.Tensor = self.model(batched_nodes, batched_edges, batched_indices) + + return v.detach().cpu().numpy() diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/models/bof_model.py b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/models/bof_model.py new file mode 100755 index 00000000000..132c623ce40 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/MICSAS/models/bof_model.py @@ 
-0,0 +1,42 @@ +''' +MIT License + +Copyright (c) 2021 Intel Labs + +Permission is hereby granted, free of charge, to any person obtaining a copy +of this software and associated documentation files (the "Software"), to deal +in the Software without restriction, including without limitation the rights +to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +copies of the Software, and to permit persons to whom the Software is +furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in all +copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +SOFTWARE. 
class BagOfFeaturesModel(nn.Module):
    """Embeds feature ids, averages them per sample and projects the mean to the output size."""

    def __init__(self, feature_emb_size, feature_vocab_size, output_size):
        super().__init__()
        embedding = nn.Embedding(feature_vocab_size, feature_emb_size)
        self.feature_emb = nn.Sequential(embedding, nn.Dropout(0.5))
        projection = nn.Linear(feature_emb_size, output_size)
        self.out = nn.Sequential(projection)

    def forward(self, features, indices):
        """``indices`` assigns every entry of ``features`` to the sample it is pooled into."""
        embedded = self.feature_emb(features)
        pooled = scatter_mean(embedded, indices, dim=0)
        return self.out(pooled)
class C2SModel(nn.Module):
    """
    Path-context encoder: each context is (left-leaf subtokens, node path, right-leaf subtokens);
    contexts are combined per sample with a learned attention vector.
    """

    def __init__(self, emb_size, subtoken_vocab_size, node_vocab_size, rnn_size, decoder_size, output_size):
        super().__init__()
        self.subtoken_emb = nn.Embedding(subtoken_vocab_size, emb_size)
        self.node_emb = nn.Embedding(node_vocab_size, emb_size)
        # Bidirectional, so each direction gets half of rnn_size.
        self.path_rnn = nn.LSTM(emb_size, rnn_size // 2, bidirectional=True, batch_first=True)

        self.emb_dropout = nn.Dropout(0.25)

        context_width = emb_size * 2 + rnn_size
        self.fc = nn.Sequential(
            nn.Linear(context_width, decoder_size, bias=False),
            nn.Tanh()
        )

        # Attention vector scored against every encoded context.
        self.a = nn.Parameter(torch.empty(decoder_size, dtype=torch.float))
        nn.init.uniform_(self.a)

        self.out = nn.Linear(decoder_size, output_size)

    def forward(self, ll_subtokens, ll_indices, rl_subtokens, rl_indices, paths, indices):
        """
        ``ll_indices`` / ``rl_indices`` map subtokens to their context, ``paths`` is a
        PackedSequence of node ids, and ``indices`` maps every context to its sample.
        """
        # Leaf embedding = sum of the embeddings of its subtokens.
        left_leaf = scatter_add(self.subtoken_emb(ll_subtokens), ll_indices, dim=0)
        right_leaf = scatter_add(self.subtoken_emb(rl_subtokens), rl_indices, dim=0)

        embedded_paths = PackedSequence(
            self.node_emb(paths.data),
            paths.batch_sizes,
            paths.sorted_indices,
            paths.unsorted_indices
        )
        _, (final_hidden, _) = self.path_rnn(embedded_paths)  # (2, batch_context_num, rnn_size // 2)
        path_summary = torch.cat((final_hidden[0], final_hidden[1]), dim=1)  # (batch_context_num, rnn_size)

        contexts = torch.cat((left_leaf, path_summary, right_leaf), dim=1)
        contexts = self.fc(self.emb_dropout(contexts))  # (batch_context_num, decoder_size)

        scores = torch.matmul(contexts, self.a)
        weights = scatter_softmax(scores, indices, dim=0)
        pooled = scatter_add(contexts * weights.unsqueeze(1), indices, dim=0)

        return self.out(pooled)
class C2VModel(nn.Module):
    """
    Path-context encoder over (leaf, path, leaf) id triples, pooled per sample
    with a learned attention vector.
    """

    def __init__(self, leaf_emb_size, leaf_vocab_size, path_emb_size, path_vocab_size, code_vec_size, output_size):
        super().__init__()
        self.leaf_emb = nn.Embedding(leaf_vocab_size, leaf_emb_size)
        self.path_emb = nn.Embedding(path_vocab_size, path_emb_size)
        self.emb_dropout = nn.Dropout(0.25)

        context_width = leaf_emb_size * 2 + path_emb_size
        self.fc = nn.Sequential(
            nn.Linear(context_width, code_vec_size, bias=False),
            nn.Tanh()
        )

        # Attention vector scored against every encoded context.
        self.a = nn.Parameter(torch.empty(code_vec_size, dtype=torch.float))
        nn.init.uniform_(self.a)

        self.out = nn.Linear(code_vec_size, output_size)

    def forward(self, contexts, indices):
        """Columns 0/1/2 of ``contexts`` are start-leaf, path and end-leaf ids; ``indices`` maps rows to samples."""
        start_leaf = self.leaf_emb(contexts[:, 0])
        path = self.path_emb(contexts[:, 1])
        end_leaf = self.leaf_emb(contexts[:, 2])

        encoded = torch.cat((start_leaf, path, end_leaf), dim=1)
        encoded = self.fc(self.emb_dropout(encoded))

        scores = torch.matmul(encoded, self.a)
        weights = scatter_softmax(scores, indices, dim=0)
        pooled = scatter_add(encoded * weights.unsqueeze(1), indices, dim=0)

        return self.out(pooled)
class CircleLoss(nn.Module):
    """Circle-loss style objective over positive (``s_p``) and negative (``s_n``) similarity scores."""

    def __init__(self, gamma, m):
        super().__init__()
        self.gamma = gamma  # scale factor applied to both logit groups
        self.m = m          # margin

    def forward(self, s_p, s_n):
        """Reduce both score tensors over dim 0 with logsumexp and return softplus of their sum."""
        margin = self.m
        scale = self.gamma

        # Per-score weights, clamped at zero.
        pos_weight = torch.clamp_min(1 + margin - s_p, 0)
        neg_weight = torch.clamp_min(margin + s_n, 0)

        pos_logits = (-scale) * pos_weight * (s_p - (1 - margin))
        neg_logits = scale * neg_weight * (s_n - margin)

        combined = torch.logsumexp(pos_logits, dim=0) + torch.logsumexp(neg_logits, dim=0)
        return F.softplus(combined)
class GNNModel(nn.Module):
    """Stack of ``RGCNLayer``s over node embeddings, followed by mean+max pooling per graph."""

    def __init__(self, node_emb_size, node_vocab_size, output_size, num_layers):
        super().__init__()
        self.num_layers = num_layers
        self.node_emb = nn.Sequential(
            nn.Embedding(node_vocab_size, node_emb_size),
            nn.Dropout(0.5)
        )
        layers = [RGCNLayer(node_emb_size) for _ in range(num_layers)]
        self.gnn_layers = nn.ModuleList(layers)
        # Input width is doubled because mean and max pooling are concatenated.
        self.out = nn.Sequential(
            nn.Linear(node_emb_size * 2, output_size)
        )

    def forward(self, nodes, edges, indices):
        """``indices`` maps every node to the graph it belongs to."""
        hidden = self.node_emb(nodes)
        for layer in self.gnn_layers:
            hidden = layer(hidden, edges)

        mean_pool = scatter_mean(hidden, indices, dim=0)
        max_pool = scatter_max(hidden, indices, dim=0)[0]  # [0]: values, [1] would be argmax
        return self.out(torch.cat((mean_pool, max_pool), dim=1))


class RGCNLayer(nn.Module):
    """Message-passing layer with a self weight (W0) and one weight per edge direction (W1, W2)."""

    def __init__(self, node_emb_size):
        super().__init__()
        self.W0 = nn.Linear(node_emb_size, node_emb_size, bias=False)
        self.W1 = nn.Linear(node_emb_size, node_emb_size, bias=False)
        self.W2 = nn.Linear(node_emb_size, node_emb_size, bias=False)

    def forward(self, nodes, edges):
        """``edges[0]`` and ``edges[1]`` hold the two endpoint indices of every edge."""
        first_end = edges[0]
        second_end = edges[1]
        # Messages travel both ways: first->second through W1, second->first through W2.
        messages = torch.cat((self.W1(nodes[first_end]), self.W2(nodes[second_end])), dim=0)
        receivers = torch.cat((second_end, first_end))
        aggregated = scatter_mean(messages, receivers, dim=0, dim_size=nodes.size(0))
        return torch.relu(self.W0(nodes) + aggregated)
class NCCModel(nn.Module):
    """Two-layer LSTM over embedded sequences; the last layer's final hidden state is normalised and projected."""

    def __init__(self, inst2vec_emb, rnn_size, dense_size, output_size, use_i2v_emb):
        super().__init__()
        if not use_i2v_emb:
            # Same vocabulary size and width as the given matrix, but freshly initialised and trainable.
            vocab_size, emb_dim = inst2vec_emb.size(0), inst2vec_emb.size(1)
            self.emb = nn.Embedding(vocab_size, emb_dim)
        else:
            # Use the given matrix as fixed (non-trainable) embeddings.
            self.emb = nn.Embedding.from_pretrained(inst2vec_emb, freeze=True)
        self.rnn = nn.LSTM(self.emb.embedding_dim, rnn_size, num_layers=2)
        self.batch_norm = nn.BatchNorm1d(rnn_size)
        self.out = nn.Sequential(
            nn.Linear(rnn_size, dense_size),
            nn.ReLU(),
            nn.Linear(dense_size, output_size)
        )

    def forward(self, seqs):
        """``seqs`` is a PackedSequence of token ids; its packing metadata is reused for the embedded data."""
        embedded = PackedSequence(
            self.emb(seqs.data),
            seqs.batch_sizes,
            seqs.sorted_indices,
            seqs.unsorted_indices
        )

        _, (final_hidden, _) = self.rnn(embedded)
        top_layer_state = final_hidden[-1]

        return self.out(self.batch_norm(top_layer_state))
class SBTModel(nn.Module):
    """Bidirectional GRU over token sequences; per-sequence states are mean+max pooled per sample."""

    def __init__(self, token_emb_size, token_vocab_size, hidden_size, output_size):
        super().__init__()
        self.hidden_size = hidden_size
        self.token_emb = nn.Sequential(
            nn.Embedding(token_vocab_size, token_emb_size),
            nn.Dropout(0.5)
        )
        self.rnn = nn.GRU(token_emb_size, hidden_size, bidirectional=True)
        # 2 directions x 2 pooling operations = 4 * hidden_size input features.
        self.proj = nn.Sequential(
            nn.Linear(hidden_size * 4, output_size)
        )

    def forward(self, seqs, indices):
        """``seqs`` is a PackedSequence of token ids; ``indices`` maps every sequence to its sample."""
        embedded = PackedSequence(
            self.token_emb(seqs.data),
            seqs.batch_sizes,
            seqs.sorted_indices,
            seqs.unsorted_indices
        )

        _, final_hidden = self.rnn(embedded)

        # Join the final states of the two directions.
        seq_state = torch.cat((final_hidden[0], final_hidden[1]), dim=1)

        mean_pool = scatter_mean(seq_state, indices, dim=0)
        max_pool = scatter_max(seq_state, indices, dim=0)[0]
        pooled = torch.cat((mean_pool, max_pool), dim=1)

        return self.proj(pooled)
in the original implementation come with a configuration setup. This is the setup (most likely) used in this project and decides on whether a node gets a label. + + annot_mode : Annotations + compound_mode: Compound Statements + gvar_mode : Global Variable + gfun_mode : Global Function + fsig_mode : Function Signatures + +Unfortunately we don't know for sure how labels influence the Cass string as changing the configuration inside the original implementation cloned from GitHub has no effect on the final output string. + +A Node according to the original implementation consists of 3 parts: + 1) Node type : + -> I : Internal + -> N / C / S : Number / Char / String literal + -> F : Global function + -> f : Local function + -> V : Global variable + -> v : Local variable + -> S : Function signature + -> E : Error * not implemented + + 2) Annotation : #compound_statement#, #init_declarator# etc. + 3) Labels : #VAR, #GVAR, #GFUN, {#} ? + +In this project we focused on replicating the Cass string building logic of the original implementation to be able to then vectorize it and calculate a similarity score. Our nodes include node types, annotations, observed suffixes representing a binary operation or the number of immediate children nodes using dollar signs "$=$", {$$$} as well as variable/function names. While building the string, nodes are separated using '\t', followed by either the number of immediate children nodes like '2', or the number (id) of the node in which a local variable/function was previously used and the number of the node in which it will next be used (-1 when there is no such node).
+ +Here's an example of a Cass string for a simple program obtained from the original implementation showing the structure we were trying to implement : + +int summation(int start_val, int end_val) { + int sum = 0; + for (int i = start_val; i <= end_val; ++i) { + sum += i; + } + return sum; +} + +['0,0,6,1\t23\tS#FS#1_2\tI#compound_statement#{$$$}\t3\tI#declaration#int$;\t1\tI#init_declarator#$=$\t2\tvsum\t-1\t19\tN0\tI#for_statement#for($$;$)$\t4\tI#declaration#int$;\t1\tI#init_declarator#$=$\t2\tvi\t-1\t12\tvstart_val\t-1\t-1\tI#binary_expression#$<=$\t2\tvi\t9\t15\tvend_val\t-1\t-1\tI#update_expression#++$\t1\tvi\t12\t20\tI#compound_statement#{$}\t1\tI#expression_statement#$;\t1\tI#assignment_expression#$+=$\t2\tvsum\t4\t22\tvi\t15\t-1\tI#return_statement#return$;\t1\tvsum\t19\t-1\t'] + +-> 0,0,6,1 being the source range (start_row, start_col, end_row, end_col) +-> first number is the total number of nodes, here 23 +""" + + + +class MyCassVisitor(CASSVisitor): + + def __init__(self): + super().__init__() + self.scopes = [] # keeping track of scopes to differenciate between local/global + self.function_nesting_level = 0 + + def visitProg(self, ctx: CASSParser.ProgContext): + + root = CassNode("removed") # Root node to remove later + + for statement in ctx.statement(): + node = self.visit(statement) + + if isinstance(node, CassNode): + # If the node is a top-level function, treat it separately + if node.label.startswith("S#FS#"): + root.add_child(node) + else: + # Other statements or nested functions are added normally + if root.children: + root.children[-1].add_child(node) + else: + root.add_child(node) + + return root + + def visitFunctionDefinition(self, ctx: CASSParser.FunctionDefinitionContext): + """ + If we're at the top (most global) level, we produce an "S#FS#..." node. + If it's nested (within another function), we produce an "I#function_definition#...". + But in both cases, we push a scope so that parameters and local variables become local. 
    def visitFunctionDefinition(self, ctx: CASSParser.FunctionDefinitionContext):
        """
        If we're at the top (most global) level, we produce an "S#FS#..." node.
        If it's nested (within another function), we produce an "I#function_definition#...".
        But in both cases, we push a scope so that parameters and local variables become local.

        The "S#FS#<t>_<n>" label encodes <t> = 0 for a 'void' return type and 1 otherwise,
        and <n> = the parameter count capped at 2. Only the top-level node gets a
        ``source_range`` attribute.
        """

        self.function_nesting_level += 1
        # 1) Push a new scope so that parameters/locals are recognized as local
        self.scopes.append(set())
        # Level 1 means this definition is not enclosed in another function definition.
        in_global_scope = (self.function_nesting_level == 1)

        # 2) Build the function node label
        func_type_text = ctx.typeSpec().getText()
        params_num = 0
        if ctx.parameterList():
            params_num = len(ctx.parameterList().parameter())

        if in_global_scope:
            # Top-level function => produce "S#FS#..." style
            func_type = 0 if func_type_text == 'void' else 1
            # The signature label only distinguishes 0, 1 and "2 or more" parameters
            if params_num > 2:
                params_num = 2
            node = CassNode(f"S#FS#{func_type}_{params_num}")

            # Lines are shifted to 0-based; the end column is shifted by one.
            # NOTE(review): presumably makes the end column exclusive -- confirm.
            start_line = ctx.start.line -1
            start_col = ctx.start.column
            end_line = ctx.stop.line -1
            end_col = ctx.stop.column +1

            node.source_range = (start_line, start_col, end_line, end_col)
        else:
            # Nested function => produce "I#function_definition#..." style
            node = CassNode(f"I#function_definition#{func_type_text}$$")


        # 3) Nested functions get an explicit declarator subtree; top-level ones do not.
        if not in_global_scope:
            # Create "I#function_declarator#$$" or similar
            if params_num == 0:
                decl_label = "I#function_declarator#$()"
            else:
                decl_label = "I#function_declarator#$$"
            decl_node = CassNode(decl_label)

            # The function name (the grammar has "primaryExpression" after typeSpec)
            func_name = ctx.primaryExpression().getText()
            decl_node.add_child(CassNode(f"v{func_name}"))

            # If there are parameters, build the param list (which also adds them to scope)
            if ctx.parameterList():
                param_list_node = self.visitParameterList(ctx.parameterList())
                decl_node.add_child(param_list_node)

            node.add_child(decl_node)
        else:

            # The returned parameter-list node is discarded on purpose: the call is
            # made only for its side effect of registering the names in the scope.
            if ctx.parameterList():
                self.visitParameterList(ctx.parameterList()) # Adds param names to scope

        # 4) Visit the compound statement so local declarations become part of the scope
        block_node = self.visit(ctx.compoundStatement())
        node.add_child(block_node)

        # 5) Pop the scope after finishing
        self.scopes.pop()

        self.function_nesting_level -= 1

        return node
node + + def visitParameterList(self, ctx: CASSParser.ParameterListContext): + + num_params = len(ctx.parameter()) + placeholders = ",".join(["$"] * num_params) + node = CassNode(f'I#parameter_list#({placeholders})') + #node.add_child(CassNode(f"{num_params}")) + for p in ctx.parameter(): + node.add_child(self.visit(p)) + return node + + def visitParameter(self, ctx: CASSParser.ParameterContext): + + param_type = ctx.typeSpec().getText() + param_name = ctx.primaryExpression().getText() + + if self.scopes: + self.scopes[-1].add(param_name) + + node = CassNode(f"I#parameter_declaration#{param_type}$") + #node.add_child(CassNode("1")) + node.add_child(self.visit(ctx.primaryExpression())) + + return node + + def visitCompoundStatement(self, ctx: CASSParser.CompoundStatementContext): + # 1) Push a new empty set for local declarations in this block + self.scopes.append(set()) + + # Count the number of direct statements (children) in the compound statement + num_children = len(ctx.statement()) + dollar_signs = "$" * num_children # Create the correct number of $ placeholders + block_node = CassNode(f"I#compound_statement#{{{dollar_signs}}}") + #block_node.add_child(CassNode(F"{num_children}")) + block_node.is_in_comp_stmt = True + + # Add each statement as a direct child + for st in ctx.statement(): + stmt_node = self.visit(st) + #stmt_node.is_in_comp_stmt = True + block_node.add_child(stmt_node) + + # 4) Pop the scope after leaving this block + self.scopes.pop() + return block_node + + def visitIncludeStatement(self, ctx: CASSParser.IncludeStatementContext): + return CassNode("removed") + + def visitDeclarationStatement(self, ctx: CASSParser.DeclarationStatementContext): + + type_label = ctx.typeSpec().getText() + + decl_node = CassNode(f"I#declaration#{type_label}$;") + + #Array handling + if ctx.arrayDeclarator(): + + if ctx.emptyInitializer() or ctx.nullptr() or ctx.expression() : + + placeholder = '$' + + array_decl = self.visit(ctx.arrayDeclarator()) + + 
    def visitDeclarationStatement(self, ctx: CASSParser.DeclarationStatementContext):
        """
        Build an "I#declaration#<type>$;" node for a variable or array declaration.

        The single child is one of:
          * the array declarator or plain name, when there is no initializer;
          * an "I#pointer_declarator#*$" node wrapping the name, for an
            uninitialized pointer;
          * an "I#init_declarator#$=<p>" node, where <p> is "$" for an expression
            initializer, "{}" for an empty initializer and "nullptr" for nullptr.
        """

        type_label = ctx.typeSpec().getText()

        decl_node = CassNode(f"I#declaration#{type_label}$;")

        #Array handling
        # NOTE(review): unlike the plain-variable path below, this path does not add
        # the declared name to self.scopes here -- confirm whether the array
        # declarator visit takes care of it.
        if ctx.arrayDeclarator():

            if ctx.emptyInitializer() or ctx.nullptr() or ctx.expression() :

                placeholder = '$'

                array_decl = self.visit(ctx.arrayDeclarator())

                if(ctx.emptyInitializer()):
                    placeholder = '{}'

                if(ctx.nullptr()):
                    placeholder = "nullptr"

                # An expression initializer becomes a child of the array declarator itself.
                if ctx.expression():
                    helperNode = self.visit(ctx.expression())
                    array_decl.add_child(helperNode)


                init_decl = CassNode(f"I#init_declarator#$={placeholder}")
                init_decl.add_child(array_decl)
                decl_node.add_child(init_decl)

            else:

                decl_node.add_child(self.visit(ctx.arrayDeclarator()))

            return decl_node


        if ctx.primaryExpression():

            # Mark this variable as local in the top scope
            var_name = ctx.primaryExpression().getText()

            if len(self.scopes) > 0:
                self.scopes[-1].add(var_name)

            pointer_node = CassNode("I#pointer_declarator#*$")

            # Pointer declaration without any initializer: "<type> *name;"
            if ctx.POINTER() and not(ctx.nullptr()) and not(ctx.emptyInitializer()) and not(ctx.expression()) :

                pointer_node.add_child(self.visit(ctx.primaryExpression()))
                decl_node.add_child(pointer_node)
                return decl_node

            if ctx.expression() or ctx.nullptr() or ctx.emptyInitializer():

                placeholder = '$'

                if(ctx.emptyInitializer()):
                    placeholder = '{}'

                if(ctx.nullptr()):
                    placeholder = "nullptr"

                # The initializer expression is visited BEFORE the declared name,
                # although it is attached after it as a later child.
                if ctx.expression():
                    helperNode = self.visit(ctx.expression())

                assign_node = CassNode(f"I#init_declarator#$={placeholder}")

                if(ctx.POINTER()):

                    pointer_node.add_child(self.visit(ctx.primaryExpression()))

                    # For pointers the initializer hangs under the pointer declarator.
                    if ctx.expression():
                        pointer_node.add_child(helperNode)

                    assign_node.add_child(pointer_node)

                else :

                    assign_node.add_child(self.visit(ctx.primaryExpression()))

                    if ctx.expression():
                        assign_node.add_child(helperNode)


                decl_node.add_child(assign_node)

            else:

                # Plain declaration without initializer: the name is the only child.
                decl_node.add_child(self.visit(ctx.primaryExpression()))

        return decl_node


    def visitListInitializer(self, ctx: CASSParser.ListInitializerContext):
        """Return an "I#initializer_list#{$,$,...}" node with one child per listed element."""

        placeholders = ",".join(["$"] * len(ctx.primaryExpression()))
        list_init = CassNode(f"I#initializer_list#{{{placeholders}}}")
        for c in ctx.primaryExpression():
            list_init.add_child(self.visit(c))

        return list_init
visitForBlockStatement(self, ctx: CASSParser.ForBlockStatementContext): + + for_node = CassNode(f"I#for_statement#for($$;$)$") + #for_node.add_child(CassNode("4")) + + # Initialization (forInit) + if ctx.declarationStatement(): + init_node = self.visit(ctx.declarationStatement()) + else: + init_node = self.visit(ctx.assignmentExpression()) + + for_node.add_child(init_node) + + cond_node = self.visit(ctx.logicalOrExpression()) + for_node.add_child(cond_node) + + # Update (forUpdate) + if ctx.unaryExpression(): + update_node = self.visit(ctx.unaryExpression()) + else: + for_node.add_child(CassNode("EMPTY_UPDATE")) + + for_node.add_child(update_node) + + + # Body (multiple statements in the block) + for_node.add_child(self.visit(ctx.compoundStatement())) + + return for_node + + + def visitForSingleStatement(self, ctx: CASSParser.ForSingleStatementContext): + for_node = CassNode("I#for_statement#for($$;$)$") + #for_node.add_child(CassNode("4")) + + # Initialization (forInit) + if ctx.forInit(): + init_node = self.visit(ctx.forInit()) + for_node.add_child(init_node) + else: + for_node.add_child(CassNode("EMPTY_INIT")) + + # Condition + if ctx.expression(): + cond_node = self.visit(ctx.expression()) + for_node.add_child(cond_node) + else: + for_node.add_child(CassNode("EMPTY_COND")) + + # Update (forUpdate) + if ctx.forUpdate(): + update_node = self.visit(ctx.forUpdate()) + for_node.add_child(update_node) + else: + for_node.add_child(CassNode("EMPTY_UPDATE")) + + # Body (single statement) + body_node = self.visit(ctx.statement()) + for_node.add_child(body_node) + + + return for_node + + def visitConditionClause(self, ctx: CASSParser.ConditionClauseContext): + node = CassNode("I#condition_clause#($)") + + if ctx.logicalOrExpression(): + node.add_child(self.visit(ctx.logicalOrExpression())) + + return node + + + def visitWhileBlockStatement(self, ctx: CASSParser.WhileBlockStatementContext): + + while_node = CassNode("I#while_statement#while$$") + + # Condition + cond_node 
= self.visit(ctx.conditionClause()) + while_node.add_child(cond_node) + while_node.add_child(self.visit(ctx.compoundStatement())) + + return while_node + + def visitWhileSingleStatement(self, ctx: CASSParser.WhileSingleStatementContext): + + while_node = CassNode("I#while_statement#while$$") + + # Condition + cond_node = self.visit(ctx.conditionClause()) + while_node.add_child(cond_node) + + # Single body statement + body_node = self.visit(ctx.statement()) + while_node.add_child(body_node) + + return while_node + + def visitIfBlockStatement(self, ctx: CASSParser.IfBlockStatementContext): + + num_children = 0 + if ctx.conditionClause(): + num_children += 1 + + if ctx.compoundStatement(): + num_children += 1 + + if ctx.elseClause(): + num_children += 1 + + dollar_signs = "$" * num_children # Create the correct number of $ placeholders + + # Create a node for the "if" statement + if_node = CassNode(f"I#if_statement#if{dollar_signs}") + + cond_node = self.visit(ctx.conditionClause()) + if_node.add_child(cond_node) + + # Separate "if" and "else" blocks + # Visit the 'if' body (compoundStatement) and add as a child + if_body_node = self.visit(ctx.compoundStatement()) + if_node.add_child(if_body_node) + + # Handle 'else' clause if present + if ctx.elseClause(): + else_clause_node = self.visit(ctx.elseClause()) + if_node.add_child(else_clause_node) + + return if_node + + def visitElseClause(self, ctx: CASSParser.ElseClauseContext): + else_node = CassNode("I#else_clause#else$") + + if ctx.ifBlockStatement(): + nested_if_node = self.visit(ctx.ifBlockStatement()) + else_node.add_child(nested_if_node) + elif ctx.compoundStatement(): + else_body_node = self.visit(ctx.compoundStatement()) + else_node.add_child(else_body_node) + else: + # It's a simple 'else' -> visit the statement + else_body_node = self.visit(ctx.statement()) + else_node.add_child(else_body_node) + + return else_node + + + + def visitIfSingleStatement(self, ctx: CASSParser.IfSingleStatementContext): + 
num_children = 0 + if ctx.conditionClause(): + num_children += 1 + + if ctx.statement(): + num_children += 1 + + if ctx.elseClause(): + num_children += 1 + + dollar_signs = "$" * num_children # Create the correct number of $ placeholders + + # Create a node for the "if" statement + if_node = CassNode(f"I#if_statement#if{dollar_signs}") + + # Condition + cond_node = self.visit(ctx.conditionClause()) + if_node.add_child(cond_node) + + # Single "if" body statement + if_body_node = self.visit(ctx.statement()) + if_node.add_child(if_body_node) + + # Optional "else" + if ctx.elseClause(): + else_node = self.visit(ctx.elseClause()) + if_node.add_child(else_node) + + return if_node + + def visitSwitchStatement(self, ctx: CASSParser.SwitchStatementContext): + + switch_node = CassNode("I#switch_statement#switch$$") + switch_node.add_child(self.visit(ctx.conditionClause())) + switch_node.add_child(self.visit(ctx.compoundStatement())) + + return switch_node + + def visitCaseStatement(self, ctx: CASSParser.CaseStatementContext): + + case_name = 'case$' + has_break = '' + + if ctx.breakExpression(): + has_break = 'break' + + if ctx.defaultExpression(): + case_name = 'default' + + num_statement = len(ctx.statement()) + placeholder = "$" * num_statement + + case_node = CassNode(f"I#case_statement#{case_name}:{placeholder}{has_break}") + + if(ctx.primaryExpression()): + case_node.add_child(self.visit(ctx.primaryExpression())) + + for c in ctx.statement(): + case_node.add_child(self.visit(c)) + + return case_node + + def visitLogicalOrExpression(self, ctx: CASSParser.LogicalOrExpressionContext): + if len(ctx.logicalAndExpression()) == 1: + # If there is only one logicalAndExpression, visit it directly + return self.visit(ctx.logicalAndExpression(0)) + + # Otherwise, create a node to represent the OR operation + node = CassNode("I#binary_expression#$||$") + + + for expr in ctx.logicalAndExpression(): + node.add_child(self.visit(expr)) + + return node + + def 
visitLogicalAndExpression(self, ctx: CASSParser.LogicalAndExpressionContext): + if len(ctx.equalityExpression()) == 1: + return self.visit(ctx.equalityExpression(0)) + + node = CassNode("I#binary_expression#$&&$") + + + for expr in ctx.equalityExpression(): + node.add_child(self.visit(expr)) + + return node + + def visitEqualityExpression(self, ctx: CASSParser.EqualityExpressionContext): + if len(ctx.relationalExpression()) == 1: + return self.visit(ctx.relationalExpression(0)) + + node = CassNode(f"I#binary_expression#${ctx.getChild(1).getText()}$") + + + lhs = self.visit(ctx.relationalExpression(0)) # Left operand + rhs = self.visit(ctx.relationalExpression(1)) # Right operand + + node.add_child(lhs) + node.add_child(rhs) + + return node + + def visitRelationalExpression(self, ctx: CASSParser.RelationalExpressionContext): + # If there's only one child additiveExpression, just pass it up the chain + if len(ctx.children) == 1: + return self.visit(ctx.additiveExpression(0)) + + # If there's an operator like "<=" or ">" ... + left = self.visit(ctx.additiveExpression(0)) + op = ctx.getChild(1).getText() # e.g. "<=" + right = self.visit(ctx.additiveExpression(1)) + + # Create a node labeled "$<=$" (or "$>$" etc.) 
+ node = CassNode(f"I#binary_expression#${op}$") + node.add_child(left) + node.add_child(right) + return node + + def visitAdditiveExpression(self, ctx: CASSParser.AdditiveExpressionContext): + # If there's only one child, pass it up the chain (e.g., "a") + if len(ctx.children) == 1: + return self.visit(ctx.multiplicativeExpression(0)) + + # If there are multiple operands, create a node for each operator and operand + operands = ctx.multiplicativeExpression() + result = self.visit(operands[0]) # Start with the first operand + + for i in range(1, len(operands)): + operator = ctx.getChild(2 * i - 1).getText() # Get "+" or "-" + next_operand = self.visit(operands[i]) + operator_node = CassNode(f"I#binary_expression#${operator}$") + #operator_node.add_child(CassNode("2")) + operator_node.add_child(result) + operator_node.add_child(next_operand) + result = operator_node # Update the result to the new operator node + + return result + + def visitMultiplicativeExpression(self, ctx: CASSParser.MultiplicativeExpressionContext): + # If there's only one child, pass it up the chain (e.g., "a") + if len(ctx.children) == 1: + return self.visit(ctx.unaryExpression(0)) + + # If there are multiple operands, create a node for each operator and operand + operands = ctx.unaryExpression() + result = self.visit(operands[0]) # Start with the first operand + + for i in range(1, len(operands)): + operator = ctx.getChild(2 * i - 1).getText() # Get "*" or "/" + next_operand = self.visit(operands[i]) + operator_node = CassNode(f"I#binary_expression#${operator}$") + #operator_node.add_child(CassNode("2")) + operator_node.add_child(result) + operator_node.add_child(next_operand) + result = operator_node # Update the result to the new operator node + + return result + + + + def visitFunctionCall(self, ctx: CASSParser.FunctionCallContext): + + # 1) The function name is the ID + func_name = ctx.ID().getText() # e.g. 
"init" + + # call_expression always has 2 children: name and parameter list + call_node = CassNode("I#call_expression#$$") + + # 3) First child = "F", e.g. Finit + func_node = CassNode(f"F{func_name}") + call_node.add_child(func_node) + + # 4) Second child = the argument list (which might be empty) + if ctx.argumentList(): + arg_list_node = self.visit(ctx.argumentList()) + call_node.add_child(arg_list_node) + else: + # No arguments => #argument_list#() with zero placeholders + empty_args = CassNode("I#argument_list#()") + call_node.add_child(empty_args) + + return call_node + + + def visitArgumentList(self, ctx: CASSParser.ArgumentListContext): + """ + Grammar snippet: + argumentList + : expression (',' expression)* # ArgumentList + ; + """ + # Count how many arguments we have + num_args = len(ctx.expression()) + + # Create a label like #argument_list#($,$,$...) with as many $ as arguments + placeholders = ",".join(["$"] * num_args) # Join $ with commas if more than one + arg_list_node = CassNode(f"I#argument_list#({placeholders})") + + + # For each expression argument, visit it and add as a child + for expr_ctx in ctx.expression(): + arg_node = self.visit(expr_ctx) + arg_list_node.add_child(arg_node) + + return arg_list_node + + + def visitReturnStatement(self, ctx: CASSParser.ReturnStatementContext): + # e.g. 
"return sum;" + node = CassNode("I#return_statement#return$;") + if ctx.expression(): + expr_node = self.visit(ctx.expression()) + node.add_child(expr_node) + return node + + def visitExpressionStatement(self, ctx: CASSParser.ExpressionStatementContext): + + statement_node = CassNode("I#expression_statement#$;") + + # 2) Visit the expression, which might yield something like "$+=$" + expr_node = self.visit(ctx.expression()) + + # 3) Add it as a child + statement_node.add_child(expr_node) + + return statement_node + + + # --------------------- + # Expression Collapsing + # --------------------- + def visitExpression(self, ctx: CASSParser.ExpressionContext): + + if ctx.assignmentExpression(): + return self.visit(ctx.assignmentExpression()) + + return None + + + def visitAssignmentExpression(self, ctx: CASSParser.AssignmentExpressionContext): + # Distinguish between: + # unaryExpression assignmentOperator assignmentExpression + # vs + # logicalOrExpression + + if ctx.assignmentOperator(): + # e.g. b = b + 1 + op_text = ctx.assignmentOperator().getText() # '=' or '+=' or ... + + placeholder = '$' + + if ctx.nullptr(): + placeholder = 'nullptr' + + if ctx.emptyInitializer(): + placeholder = '{}' + + # Use a node labeled #assignment_expression#$ + # For a simple '=' you might produce '#assignment_expression#$=$' + # For '+=' maybe '#assignment_expression#$+=$', etc. + node = CassNode(f"I#assignment_expression#$" + op_text + placeholder) + + lhs = self.visit(ctx.unaryExpression()) # e.g. b + node.add_child(lhs) + + if ctx.assignmentExpression(): + rhs = self.visit(ctx.assignmentExpression()) # e.g. 
b + 1 + node.add_child(rhs) + + + return node + else: + # No assignment operator => just pass logicalOrExpression up + return self.visit(ctx.logicalOrExpression()) + + + def visitUnaryExpression(self, ctx: CASSParser.UnaryExpressionContext): + + if ctx.listInitializer(): + return self.visit(ctx.listInitializer()) + + if ctx.pointerExpression(): + return self.visit(ctx.pointerExpression()) + + # If it's prefix like ++i + if ctx.unaryExpression(): + op = ''.join('$' if x not in ('+', '-') else x for x in ctx.getText()) + node = CassNode(f"I#update_expression#{op}") + node.add_child(self.visit(ctx.unaryExpression())) + return node + else: + + return self.visit(ctx.primaryExpression()) + + def isLocal(self, var_name: str) -> bool: + # Search from the top of the stack downward + for scope_set in reversed(self.scopes): + if var_name in scope_set: + return True + return False + + def visitPointerExpression(self, ctx: CASSParser.PointerExpressionContext): + + var_text = ctx.primaryExpression().getText() + sign = ctx.getText()[0] + + if self.isLocal(var_text): + ptr_node = CassNode(f"I#pointer_expression#{sign}$") + ptr_node.add_child(self.visit(ctx.primaryExpression())) + else: + ptr_node = CassNode(f"I#pointer_expression#{sign}$") + ptr_node.add_child(self.visit(ctx.primaryExpression())) + + return ptr_node + + def visitArrayDeclarator(self, ctx: CASSParser.ArrayDeclaratorContext): + + + if len(ctx.primaryExpression()) > 1: + + var_name = ctx.primaryExpression(0).getText() + + if len(self.scopes) > 0: + self.scopes[-1].add(var_name) + + arr_dclr = CassNode("I#array_declarator#$[$]") + arr_dclr.add_child(self.visit(ctx.primaryExpression(0))) + arr_dclr.add_child(self.visit(ctx.primaryExpression(1))) + + elif len(ctx.primaryExpression()) == 1: + + var_name = ctx.primaryExpression(0).getText() + + if len(self.scopes) > 0: + self.scopes[-1].add(var_name) + + arr_dclr = CassNode("I#array_declarator#$[]") + arr_dclr.add_child(self.visit(ctx.primaryExpression(0))) + + return 
arr_dclr + + + def visitPrimaryExpression(self, ctx: CASSParser.PrimaryExpressionContext): + # Case 1: It's an identifier + if ctx.ID(): + + var_text = ctx.ID().getText() + + # Check if var_text is declared in the current or any parent scope + if self.isLocal(var_text): + return CassNode(f"v{var_text}") + else: + return CassNode(f"V{var_text}") + + + # Case 2: It's an integer literal + elif ctx.INT(): + lit_text = ctx.INT().getText() + return CassNode(f"N{lit_text}") + + # Case 3: It's a float literal + elif ctx.FLOAT(): + lit_text = ctx.FLOAT().getText() + return CassNode(f"N{lit_text}") + + elif ctx.CHAR(): + lit_text = ctx.CHAR().getText() + return CassNode(f"C{lit_text}") + + elif ctx.STRING(): + str_text = ctx.STRING().getText() + return CassNode(f"S{str_text}") + + # Case 4: It's parentheses => ( expression ) + elif ctx.expression(): + # 1) Visit the sub-expression + subexpr_node = self.visit(ctx.expression()) + + # 2) Check if subexpr_node is an additive expression + # For example, if your additive visitor produces "$+$" or "$-$" as the label: + if subexpr_node and subexpr_node.label in {"I#binary_expression#$+$", "I#binary_expression#$-$", "I#binary_expression#$*$", "I#binary_expression#$/$", "I#binary_expression#$%$"}: + # Create a paren node + paren_node = CassNode("I#parenthesized_expression#($)") + paren_node.add_child(subexpr_node) + return paren_node + else: + # If not additive, just return the inner expression without special wrapping + return subexpr_node + + elif ctx.functionCall(): + return self.visit(ctx.functionCall()) + + # Fallback if something unexpected + else: + return CassNode("???") + diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/README.md b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/README.md new file mode 100644 index 00000000000..33f7ca17aa4 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/README.md @@ -0,0 +1,70 @@ 
+# CASS Parsing and AST Representation + +This repository implements a CASS (Context-Aware Semantics Structure) parser using ANTLR4. It consists of the following key components: + +- **`CASS.g4`**: Defines the grammar for parsing C-like syntax using ANTLR4. +- **`MyCASSVisitor.py`**: Implements the visitor that traverses the parse tree and builds the CASS tree. +- **`DriverCASS.py`**: Acts as the main entry point for parsing and processing CASS input. +- **`CASSNode.py`**: Defines the CASS node structure and serialization utilities. + +--- + +## CASS Grammar (`CASS.g4`) +This file defines the ANTLR4 grammar for parsing a subset of C-like syntax, including: +- Function definitions +- Statements (if, while, for, return, switch, case, etc.) +- Expressions (arithmetic, logical, assignment) +- Parenthesized expressions +- Function calls +- Variable declarations +- Arrays, lists and pointers + +The grammar ensures a well-structured parse tree that is then visited by `MyCASSVisitor.py`. + +--- + +## CASS Visitor (`MyCASSVisitor.py`) +This module implements the visitor pattern for processing all parsed components using the grammar file. Key functionalities include: + +- Constructing `CassNode` objects. +- **Labeling for nodes**, including variable declarations, expressions, and operators. +- **Child management**, allowing hierarchical tree representation. +- Distinguishing between **local and global variables**. +- Recognizing **parenthesized expressions** and **operator precedence**. +- Properly formatting function calls and argument lists. + ... + +The visitor ensures a structured transformation of the parsed syntax into an intermediate AST representation. + +--- + +## Driver (`DriverCASS.py`) +The driver script serves as the main entry point for executing the CASS parsing pipeline. It: +- Loads and **compiles the grammar** using ANTLR4. +- Instantiates the `MyCASSVisitor` to process the parse tree. +- Generates and prints the corresponding AST structure. 
+- Serializes the AST into the expected CASS string format. + +This script acts as the core engine for testing and processing input files. + +--- + +## Node Representation (`CASSNode.py`) +This file defines the `CassNode` class, which represents a node in the CASS tree. It includes: +- **Serialization to CASS format**, ensuring proper formatting for output. +- **GraphViz DOT export**, enabling visualization of the tree structure. + +The `CassNode` class provides the foundational structure for storing and manipulating AST representations. + +--- + +## How to Run +Ensure you have ANTLR4 installed and available in your environment. First generate the Python parser and visitor from the grammar, then run the driver: +``` +java -jar "antlr-4.13.2-complete.jar" -Dlanguage=Python3 -visitor CASS.g4 +python DriverCASS.py +``` + +## Our Jupyter Notebook +We also created a Jupyter notebook, `Execution.ipynb`, with integrated vectorization and similarity score calculation using a pretrained graph neural network provided by the authors of the MISIM paper. Running it may require installing additional Python packages. 
+ diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/antlr-4.13.2-complete.jar b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/antlr-4.13.2-complete.jar new file mode 100644 index 00000000000..75bfcc39763 Binary files /dev/null and b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/antlr-4.13.2-complete.jar differ diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/cass.dot b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/cass.dot new file mode 100644 index 00000000000..fa8369c904b --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/cass.dot @@ -0,0 +1,50 @@ +digraph CASS { + node [shape=ellipse]; + n1 [label="[1]: S#FS#1_0"]; + n2 [label="[2]: I#compound_statement#{$$$}"]; + n3 [label="[3]: I#declaration#int$;"]; + n4 [label="[4]: I#init_declarator#$=$"]; + n5 [label="[5]: vn"]; + n6 [label="[6]: N10"]; + n7 [label="[7]: I#while_statement#while$$"]; + n8 [label="[8]: I#condition_clause#($)"]; + n9 [label="[9]: I#binary_expression#$<=$"]; + n10 [label="[10]: Vtotal"]; + n11 [label="[11]: vn"]; + n12 [label="[12]: I#compound_statement#{$$}"]; + n13 [label="[13]: I#expression_statement#$;"]; + n14 [label="[14]: I#assignment_expression#$=$"]; + n15 [label="[15]: Vtotal"]; + n16 [label="[16]: N10"]; + n17 [label="[17]: I#expression_statement#$;"]; + n18 [label="[18]: I#assignment_expression#$=$"]; + n19 [label="[19]: Vi"]; + n20 [label="[20]: I#binary_expression#$+$"]; + n21 [label="[21]: Vi"]; + n22 [label="[22]: N1"]; + n23 [label="[23]: I#return_statement#return$;"]; + n24 [label="[24]: N0"]; + n1 -> n2; + n2 -> n3; + n3 -> n4; + n4 -> n5; + n4 -> n6; + n2 -> n7; + n7 -> n8; + n8 -> n9; + n9 -> n10; + n9 -> n11; + n7 -> n12; + n12 -> n13; + n13 -> n14; + n14 -> n15; + n14 -> n16; + n12 -> n17; + n17 -> n18; + n18 -> n19; + n18 -> n20; + n20 -> n21; + n20 -> n22; + n2 -> 
n23; + n23 -> n24; +} \ No newline at end of file diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/cass.png b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/cass.png new file mode 100644 index 00000000000..f0eb14959f4 Binary files /dev/null and b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/cass.png differ diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/input_code_ez.c b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/input_code_ez.c new file mode 100644 index 00000000000..0cac291d566 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/input_code_ez.c @@ -0,0 +1,10 @@ +int main() { + int n, total = 0, i = 1; + scanf("%d", &n); + while (i <= n) { + total += i; + i++; + } + printf("%d\n", total); + return 0; +} \ No newline at end of file diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/input_code_og.c b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/input_code_og.c new file mode 100644 index 00000000000..d46d32781f1 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/input_code_og.c @@ -0,0 +1,7 @@ +int summation(int start_val, int end_val) { + int sum = 0; + for (int i = start_val; i <= end_val; ++i) { + sum += i; + } + return sum; +} diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/requirements.txt b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/requirements.txt new file mode 100644 index 00000000000..7a967d5e2f7 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/requirements.txt @@ -0,0 +1 @@ +antlr4-python3-runtime==4.13.0 \ No newline at end of file diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism 
Detection/test_codes/input_code_1.c b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_1.c new file mode 100644 index 00000000000..2181f3cc550 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_1.c @@ -0,0 +1,7 @@ +int addValues(int begin, int finish) { + int total = 0; + for (int idx = begin; idx <= finish; idx++) { + total += idx; + } + return total; +} \ No newline at end of file diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_2.c b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_2.c new file mode 100644 index 00000000000..1e867713b68 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_2.c @@ -0,0 +1,7 @@ +int summation(int start_val, int end_val) { + int sum = 0; + for (int i = start_val; i <= end_val; ++i) { + sum += i; + } + return sum; +} \ No newline at end of file diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_3.c b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_3.c new file mode 100644 index 00000000000..10c40731542 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_3.c @@ -0,0 +1,7 @@ +int sumNumbers(int start, int end) { + int sum = 0; + for (int i = start; i <= end; i++) { + sum += i; + } + return sum; +} diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_4.c b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_4.c new file mode 100644 index 00000000000..84cfac2091c --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_4.c @@ 
-0,0 +1,9 @@ +int sumNumbers(int start, int end) { + int sum = 0; + int i = start; + while (i <= end) { + sum += i; + i++; + } + return sum; +} diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_5.c b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_5.c new file mode 100644 index 00000000000..6e28b2f6408 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_5.c @@ -0,0 +1,12 @@ +int calc_factorial(int n) { + if (n < 0) { + // Factorial not defined for negative numbers + return -1; + } else if (n == 0 || n == 1) { + return 1; + } else { + return n * factorial(n - 1); + } +} + + diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_6.c b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_6.c new file mode 100644 index 00000000000..7043e7c0eaa --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_6.c @@ -0,0 +1,20 @@ +int main() { + int num; + + + if (num < 0) { + printf("Error: Negative input is not allowed.\n"); + return 1; + } + + float result = 1; + int counter = 1; + + while (counter <= num) { + result *= counter; + counter++; + } + + printf("Factorial of %d is %lld\n", num, result); + return 0; +} \ No newline at end of file diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_7.c b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_7.c new file mode 100644 index 00000000000..42eeee4ff53 --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_7.c @@ -0,0 +1,10 @@ +int main() { + int n = 0; + int sum = 0; + scanf("%d", &n); + for (int i = 1; i <= n; i++) { + sum += i; + } + 
printf("%d\n", sum); + return 0; +} \ No newline at end of file diff --git a/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_8.c b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_8.c new file mode 100644 index 00000000000..84739bb7c4b --- /dev/null +++ b/src/main/python/[SYSTEMDS-3191] Entity Resolution for Plagiarism Detection/test_codes/input_code_8.c @@ -0,0 +1,8 @@ +int main(int a) { + x = "this cass logi was very hard to implement"; + int total = 25; + string = x + total; + return string; + + +} \ No newline at end of file