smc_clc.c 37 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370
  1. // SPDX-License-Identifier: GPL-2.0
  2. /*
  3. * Shared Memory Communications over RDMA (SMC-R) and RoCE
  4. *
  5. * CLC (connection layer control) handshake over initial TCP socket to
  6. * prepare for RDMA traffic
  7. *
  8. * Copyright IBM Corp. 2016, 2018
  9. *
  10. * Author(s): Ursula Braun <ubraun@linux.vnet.ibm.com>
  11. */
  12. #include <linux/in.h>
  13. #include <linux/inetdevice.h>
  14. #include <linux/if_ether.h>
  15. #include <linux/sched/signal.h>
  16. #include <linux/utsname.h>
  17. #include <linux/ctype.h>
  18. #include <net/addrconf.h>
  19. #include <net/sock.h>
  20. #include <net/tcp.h>
  21. #include "smc.h"
  22. #include "smc_core.h"
  23. #include "smc_clc.h"
  24. #include "smc_ib.h"
  25. #include "smc_ism.h"
  26. #include "smc_netlink.h"
  27. #define SMCR_CLC_ACCEPT_CONFIRM_LEN 68
  28. #define SMCD_CLC_ACCEPT_CONFIRM_LEN 48
  29. #define SMCD_CLC_ACCEPT_CONFIRM_LEN_V2 78
  30. #define SMCR_CLC_ACCEPT_CONFIRM_LEN_V2 108
  31. #define SMC_CLC_RECV_BUF_LEN 100
  32. /* eye catcher "SMCR" EBCDIC for CLC messages */
  33. static const char SMC_EYECATCHER[4] = {'\xe2', '\xd4', '\xc3', '\xd9'};
  34. /* eye catcher "SMCD" EBCDIC for CLC messages */
  35. static const char SMCD_EYECATCHER[4] = {'\xe2', '\xd4', '\xc3', '\xc4'};
  36. static u8 smc_hostname[SMC_MAX_HOSTNAME_LEN];
  37. struct smc_clc_eid_table {
  38. rwlock_t lock;
  39. struct list_head list;
  40. u8 ueid_cnt;
  41. u8 seid_enabled;
  42. };
  43. static struct smc_clc_eid_table smc_clc_eid_table;
  44. struct smc_clc_eid_entry {
  45. struct list_head list;
  46. u8 eid[SMC_MAX_EID_LEN];
  47. };
  48. /* The size of a user EID is 32 characters.
  49. * Valid characters should be (single-byte character set) A-Z, 0-9, '.' and '-'.
  50. * Blanks should only be used to pad to the expected size.
  51. * First character must be alphanumeric.
  52. */
  53. static bool smc_clc_ueid_valid(char *ueid)
  54. {
  55. char *end = ueid + SMC_MAX_EID_LEN;
  56. while (--end >= ueid && isspace(*end))
  57. ;
  58. if (end < ueid)
  59. return false;
  60. if (!isalnum(*ueid) || islower(*ueid))
  61. return false;
  62. while (ueid <= end) {
  63. if ((!isalnum(*ueid) || islower(*ueid)) && *ueid != '.' &&
  64. *ueid != '-')
  65. return false;
  66. ueid++;
  67. }
  68. return true;
  69. }
  70. static int smc_clc_ueid_add(char *ueid)
  71. {
  72. struct smc_clc_eid_entry *new_ueid, *tmp_ueid;
  73. int rc;
  74. if (!smc_clc_ueid_valid(ueid))
  75. return -EINVAL;
  76. /* add a new ueid entry to the ueid table if there isn't one */
  77. new_ueid = kzalloc_obj(*new_ueid);
  78. if (!new_ueid)
  79. return -ENOMEM;
  80. memcpy(new_ueid->eid, ueid, SMC_MAX_EID_LEN);
  81. write_lock(&smc_clc_eid_table.lock);
  82. if (smc_clc_eid_table.ueid_cnt >= SMC_MAX_UEID) {
  83. rc = -ERANGE;
  84. goto err_out;
  85. }
  86. list_for_each_entry(tmp_ueid, &smc_clc_eid_table.list, list) {
  87. if (!memcmp(tmp_ueid->eid, ueid, SMC_MAX_EID_LEN)) {
  88. rc = -EEXIST;
  89. goto err_out;
  90. }
  91. }
  92. list_add_tail(&new_ueid->list, &smc_clc_eid_table.list);
  93. smc_clc_eid_table.ueid_cnt++;
  94. write_unlock(&smc_clc_eid_table.lock);
  95. return 0;
  96. err_out:
  97. write_unlock(&smc_clc_eid_table.lock);
  98. kfree(new_ueid);
  99. return rc;
  100. }
  101. int smc_clc_ueid_count(void)
  102. {
  103. int count;
  104. read_lock(&smc_clc_eid_table.lock);
  105. count = smc_clc_eid_table.ueid_cnt;
  106. read_unlock(&smc_clc_eid_table.lock);
  107. return count;
  108. }
  109. int smc_nl_add_ueid(struct sk_buff *skb, struct genl_info *info)
  110. {
  111. struct nlattr *nla_ueid = info->attrs[SMC_NLA_EID_TABLE_ENTRY];
  112. char *ueid;
  113. if (!nla_ueid || nla_len(nla_ueid) != SMC_MAX_EID_LEN + 1)
  114. return -EINVAL;
  115. ueid = (char *)nla_data(nla_ueid);
  116. return smc_clc_ueid_add(ueid);
  117. }
  118. /* remove one or all ueid entries from the table */
  119. static int smc_clc_ueid_remove(char *ueid)
  120. {
  121. struct smc_clc_eid_entry *lst_ueid, *tmp_ueid;
  122. int rc = -ENOENT;
  123. /* remove table entry */
  124. write_lock(&smc_clc_eid_table.lock);
  125. list_for_each_entry_safe(lst_ueid, tmp_ueid, &smc_clc_eid_table.list,
  126. list) {
  127. if (!ueid || !memcmp(lst_ueid->eid, ueid, SMC_MAX_EID_LEN)) {
  128. list_del(&lst_ueid->list);
  129. smc_clc_eid_table.ueid_cnt--;
  130. kfree(lst_ueid);
  131. rc = 0;
  132. }
  133. }
  134. #if IS_ENABLED(CONFIG_S390)
  135. if (!rc && !smc_clc_eid_table.ueid_cnt) {
  136. smc_clc_eid_table.seid_enabled = 1;
  137. rc = -EAGAIN; /* indicate success and enabling of seid */
  138. }
  139. #endif
  140. write_unlock(&smc_clc_eid_table.lock);
  141. return rc;
  142. }
  143. int smc_nl_remove_ueid(struct sk_buff *skb, struct genl_info *info)
  144. {
  145. struct nlattr *nla_ueid = info->attrs[SMC_NLA_EID_TABLE_ENTRY];
  146. char *ueid;
  147. if (!nla_ueid || nla_len(nla_ueid) != SMC_MAX_EID_LEN + 1)
  148. return -EINVAL;
  149. ueid = (char *)nla_data(nla_ueid);
  150. return smc_clc_ueid_remove(ueid);
  151. }
  152. int smc_nl_flush_ueid(struct sk_buff *skb, struct genl_info *info)
  153. {
  154. smc_clc_ueid_remove(NULL);
  155. return 0;
  156. }
  157. static int smc_nl_ueid_dumpinfo(struct sk_buff *skb, u32 portid, u32 seq,
  158. u32 flags, char *ueid)
  159. {
  160. char ueid_str[SMC_MAX_EID_LEN + 1];
  161. void *hdr;
  162. hdr = genlmsg_put(skb, portid, seq, &smc_gen_nl_family,
  163. flags, SMC_NETLINK_DUMP_UEID);
  164. if (!hdr)
  165. return -ENOMEM;
  166. memcpy(ueid_str, ueid, SMC_MAX_EID_LEN);
  167. ueid_str[SMC_MAX_EID_LEN] = 0;
  168. if (nla_put_string(skb, SMC_NLA_EID_TABLE_ENTRY, ueid_str)) {
  169. genlmsg_cancel(skb, hdr);
  170. return -EMSGSIZE;
  171. }
  172. genlmsg_end(skb, hdr);
  173. return 0;
  174. }
  175. static int _smc_nl_ueid_dump(struct sk_buff *skb, u32 portid, u32 seq,
  176. int start_idx)
  177. {
  178. struct smc_clc_eid_entry *lst_ueid;
  179. int idx = 0;
  180. read_lock(&smc_clc_eid_table.lock);
  181. list_for_each_entry(lst_ueid, &smc_clc_eid_table.list, list) {
  182. if (idx++ < start_idx)
  183. continue;
  184. if (smc_nl_ueid_dumpinfo(skb, portid, seq, NLM_F_MULTI,
  185. lst_ueid->eid)) {
  186. --idx;
  187. break;
  188. }
  189. }
  190. read_unlock(&smc_clc_eid_table.lock);
  191. return idx;
  192. }
  193. int smc_nl_dump_ueid(struct sk_buff *skb, struct netlink_callback *cb)
  194. {
  195. struct smc_nl_dmp_ctx *cb_ctx = smc_nl_dmp_ctx(cb);
  196. int idx;
  197. idx = _smc_nl_ueid_dump(skb, NETLINK_CB(cb->skb).portid,
  198. cb->nlh->nlmsg_seq, cb_ctx->pos[0]);
  199. cb_ctx->pos[0] = idx;
  200. return skb->len;
  201. }
  202. int smc_nl_dump_seid(struct sk_buff *skb, struct netlink_callback *cb)
  203. {
  204. struct smc_nl_dmp_ctx *cb_ctx = smc_nl_dmp_ctx(cb);
  205. char seid_str[SMC_MAX_EID_LEN + 1];
  206. u8 seid_enabled;
  207. void *hdr;
  208. u8 *seid;
  209. if (cb_ctx->pos[0])
  210. return skb->len;
  211. hdr = genlmsg_put(skb, NETLINK_CB(cb->skb).portid, cb->nlh->nlmsg_seq,
  212. &smc_gen_nl_family, NLM_F_MULTI,
  213. SMC_NETLINK_DUMP_SEID);
  214. if (!hdr)
  215. return -ENOMEM;
  216. if (!smc_ism_is_v2_capable())
  217. goto end;
  218. smc_ism_get_system_eid(&seid);
  219. memcpy(seid_str, seid, SMC_MAX_EID_LEN);
  220. seid_str[SMC_MAX_EID_LEN] = 0;
  221. if (nla_put_string(skb, SMC_NLA_SEID_ENTRY, seid_str))
  222. goto err;
  223. read_lock(&smc_clc_eid_table.lock);
  224. seid_enabled = smc_clc_eid_table.seid_enabled;
  225. read_unlock(&smc_clc_eid_table.lock);
  226. if (nla_put_u8(skb, SMC_NLA_SEID_ENABLED, seid_enabled))
  227. goto err;
  228. end:
  229. genlmsg_end(skb, hdr);
  230. cb_ctx->pos[0]++;
  231. return skb->len;
  232. err:
  233. genlmsg_cancel(skb, hdr);
  234. return -EMSGSIZE;
  235. }
  236. int smc_nl_enable_seid(struct sk_buff *skb, struct genl_info *info)
  237. {
  238. #if IS_ENABLED(CONFIG_S390)
  239. write_lock(&smc_clc_eid_table.lock);
  240. smc_clc_eid_table.seid_enabled = 1;
  241. write_unlock(&smc_clc_eid_table.lock);
  242. return 0;
  243. #else
  244. return -EOPNOTSUPP;
  245. #endif
  246. }
  247. int smc_nl_disable_seid(struct sk_buff *skb, struct genl_info *info)
  248. {
  249. int rc = 0;
  250. #if IS_ENABLED(CONFIG_S390)
  251. write_lock(&smc_clc_eid_table.lock);
  252. if (!smc_clc_eid_table.ueid_cnt)
  253. rc = -ENOENT;
  254. else
  255. smc_clc_eid_table.seid_enabled = 0;
  256. write_unlock(&smc_clc_eid_table.lock);
  257. #else
  258. rc = -EOPNOTSUPP;
  259. #endif
  260. return rc;
  261. }
  262. static bool _smc_clc_match_ueid(u8 *peer_ueid)
  263. {
  264. struct smc_clc_eid_entry *tmp_ueid;
  265. list_for_each_entry(tmp_ueid, &smc_clc_eid_table.list, list) {
  266. if (!memcmp(tmp_ueid->eid, peer_ueid, SMC_MAX_EID_LEN))
  267. return true;
  268. }
  269. return false;
  270. }
  271. bool smc_clc_match_eid(u8 *negotiated_eid,
  272. struct smc_clc_v2_extension *smc_v2_ext,
  273. u8 *peer_eid, u8 *local_eid)
  274. {
  275. bool match = false;
  276. int i;
  277. negotiated_eid[0] = 0;
  278. read_lock(&smc_clc_eid_table.lock);
  279. if (peer_eid && local_eid &&
  280. smc_clc_eid_table.seid_enabled &&
  281. smc_v2_ext->hdr.flag.seid &&
  282. !memcmp(peer_eid, local_eid, SMC_MAX_EID_LEN)) {
  283. memcpy(negotiated_eid, peer_eid, SMC_MAX_EID_LEN);
  284. match = true;
  285. goto out;
  286. }
  287. for (i = 0; i < smc_v2_ext->hdr.eid_cnt; i++) {
  288. if (_smc_clc_match_ueid(smc_v2_ext->user_eids[i])) {
  289. memcpy(negotiated_eid, smc_v2_ext->user_eids[i],
  290. SMC_MAX_EID_LEN);
  291. match = true;
  292. goto out;
  293. }
  294. }
  295. out:
  296. read_unlock(&smc_clc_eid_table.lock);
  297. return match;
  298. }
  299. /* check arriving CLC proposal */
  300. static bool smc_clc_msg_prop_valid(struct smc_clc_msg_proposal *pclc)
  301. {
  302. struct smc_clc_msg_proposal_prefix *pclc_prfx;
  303. struct smc_clc_smcd_v2_extension *smcd_v2_ext;
  304. struct smc_clc_msg_hdr *hdr = &pclc->hdr;
  305. struct smc_clc_v2_extension *v2_ext;
  306. pclc_prfx = smc_clc_proposal_get_prefix(pclc);
  307. if (!pclc_prfx ||
  308. pclc_prfx->ipv6_prefixes_cnt > SMC_CLC_MAX_V6_PREFIX)
  309. return false;
  310. if (hdr->version == SMC_V1) {
  311. if (hdr->typev1 == SMC_TYPE_N)
  312. return false;
  313. if (ntohs(hdr->length) !=
  314. sizeof(*pclc) + ntohs(pclc->iparea_offset) +
  315. sizeof(*pclc_prfx) +
  316. pclc_prfx->ipv6_prefixes_cnt *
  317. sizeof(struct smc_clc_ipv6_prefix) +
  318. sizeof(struct smc_clc_msg_trail))
  319. return false;
  320. } else {
  321. v2_ext = smc_get_clc_v2_ext(pclc);
  322. if ((hdr->typev2 != SMC_TYPE_N &&
  323. (!v2_ext || v2_ext->hdr.eid_cnt > SMC_CLC_MAX_UEID)) ||
  324. (smcd_indicated(hdr->typev2) &&
  325. v2_ext->hdr.ism_gid_cnt > SMCD_CLC_MAX_V2_GID_ENTRIES))
  326. return false;
  327. if (ntohs(hdr->length) !=
  328. sizeof(*pclc) +
  329. sizeof(struct smc_clc_msg_smcd) +
  330. (hdr->typev1 != SMC_TYPE_N ?
  331. sizeof(*pclc_prfx) +
  332. pclc_prfx->ipv6_prefixes_cnt *
  333. sizeof(struct smc_clc_ipv6_prefix) : 0) +
  334. (hdr->typev2 != SMC_TYPE_N ?
  335. sizeof(*v2_ext) +
  336. v2_ext->hdr.eid_cnt * SMC_MAX_EID_LEN : 0) +
  337. (smcd_indicated(hdr->typev2) ?
  338. sizeof(*smcd_v2_ext) + v2_ext->hdr.ism_gid_cnt *
  339. sizeof(struct smc_clc_smcd_gid_chid) :
  340. 0) +
  341. sizeof(struct smc_clc_msg_trail))
  342. return false;
  343. }
  344. return true;
  345. }
  346. /* check arriving CLC accept or confirm */
  347. static bool
  348. smc_clc_msg_acc_conf_valid(struct smc_clc_msg_accept_confirm *clc)
  349. {
  350. struct smc_clc_msg_hdr *hdr = &clc->hdr;
  351. if (hdr->typev1 != SMC_TYPE_R && hdr->typev1 != SMC_TYPE_D)
  352. return false;
  353. if (hdr->version == SMC_V1) {
  354. if ((hdr->typev1 == SMC_TYPE_R &&
  355. ntohs(hdr->length) != SMCR_CLC_ACCEPT_CONFIRM_LEN) ||
  356. (hdr->typev1 == SMC_TYPE_D &&
  357. ntohs(hdr->length) != SMCD_CLC_ACCEPT_CONFIRM_LEN))
  358. return false;
  359. } else {
  360. if (hdr->typev1 == SMC_TYPE_D &&
  361. ntohs(hdr->length) < SMCD_CLC_ACCEPT_CONFIRM_LEN_V2)
  362. return false;
  363. if (hdr->typev1 == SMC_TYPE_R &&
  364. ntohs(hdr->length) < SMCR_CLC_ACCEPT_CONFIRM_LEN_V2)
  365. return false;
  366. }
  367. return true;
  368. }
  369. /* check arriving CLC decline */
  370. static bool
  371. smc_clc_msg_decl_valid(struct smc_clc_msg_decline *dclc)
  372. {
  373. struct smc_clc_msg_hdr *hdr = &dclc->hdr;
  374. if (hdr->version == SMC_V1) {
  375. if (ntohs(hdr->length) != sizeof(struct smc_clc_msg_decline))
  376. return false;
  377. } else {
  378. if (ntohs(hdr->length) != sizeof(struct smc_clc_msg_decline_v2))
  379. return false;
  380. }
  381. return true;
  382. }
  383. static int smc_clc_fill_fce_v2x(struct smc_clc_first_contact_ext_v2x *fce_v2x,
  384. struct smc_init_info *ini)
  385. {
  386. int ret = sizeof(*fce_v2x);
  387. memset(fce_v2x, 0, sizeof(*fce_v2x));
  388. fce_v2x->fce_v2_base.os_type = SMC_CLC_OS_LINUX;
  389. fce_v2x->fce_v2_base.release = ini->release_nr;
  390. memcpy(fce_v2x->fce_v2_base.hostname,
  391. smc_hostname, sizeof(smc_hostname));
  392. if (ini->is_smcd && ini->release_nr < SMC_RELEASE_1) {
  393. ret = sizeof(struct smc_clc_first_contact_ext);
  394. goto out;
  395. }
  396. if (ini->release_nr >= SMC_RELEASE_1) {
  397. if (!ini->is_smcd) {
  398. fce_v2x->max_conns = ini->max_conns;
  399. fce_v2x->max_links = ini->max_links;
  400. }
  401. fce_v2x->feature_mask = htons(ini->feature_mask);
  402. }
  403. out:
  404. return ret;
  405. }
  406. /* check if received message has a correct header length and contains valid
  407. * heading and trailing eyecatchers
  408. */
  409. static bool smc_clc_msg_hdr_valid(struct smc_clc_msg_hdr *clcm, bool check_trl)
  410. {
  411. struct smc_clc_msg_accept_confirm *clc;
  412. struct smc_clc_msg_proposal *pclc;
  413. struct smc_clc_msg_decline *dclc;
  414. struct smc_clc_msg_trail *trl;
  415. if (memcmp(clcm->eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER)) &&
  416. memcmp(clcm->eyecatcher, SMCD_EYECATCHER, sizeof(SMCD_EYECATCHER)))
  417. return false;
  418. switch (clcm->type) {
  419. case SMC_CLC_PROPOSAL:
  420. pclc = (struct smc_clc_msg_proposal *)clcm;
  421. if (!smc_clc_msg_prop_valid(pclc))
  422. return false;
  423. trl = (struct smc_clc_msg_trail *)
  424. ((u8 *)pclc + ntohs(pclc->hdr.length) - sizeof(*trl));
  425. break;
  426. case SMC_CLC_ACCEPT:
  427. case SMC_CLC_CONFIRM:
  428. clc = (struct smc_clc_msg_accept_confirm *)clcm;
  429. if (!smc_clc_msg_acc_conf_valid(clc))
  430. return false;
  431. trl = (struct smc_clc_msg_trail *)
  432. ((u8 *)clc + ntohs(clc->hdr.length) - sizeof(*trl));
  433. break;
  434. case SMC_CLC_DECLINE:
  435. dclc = (struct smc_clc_msg_decline *)clcm;
  436. if (!smc_clc_msg_decl_valid(dclc))
  437. return false;
  438. check_trl = false;
  439. break;
  440. default:
  441. return false;
  442. }
  443. if (check_trl &&
  444. memcmp(trl->eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER)) &&
  445. memcmp(trl->eyecatcher, SMCD_EYECATCHER, sizeof(SMCD_EYECATCHER)))
  446. return false;
  447. return true;
  448. }
  449. /* find ipv4 addr on device and get the prefix len, fill CLC proposal msg */
  450. static int smc_clc_prfx_set4_rcu(struct net_device *dev, __be32 ipv4,
  451. struct smc_clc_msg_proposal_prefix *prop)
  452. {
  453. struct in_device *in_dev = __in_dev_get_rcu(dev);
  454. const struct in_ifaddr *ifa;
  455. if (!in_dev)
  456. return -ENODEV;
  457. in_dev_for_each_ifa_rcu(ifa, in_dev) {
  458. if (!inet_ifa_match(ipv4, ifa))
  459. continue;
  460. prop->prefix_len = inet_mask_len(ifa->ifa_mask);
  461. prop->outgoing_subnet = ifa->ifa_address & ifa->ifa_mask;
  462. /* prop->ipv6_prefixes_cnt = 0; already done by memset before */
  463. return 0;
  464. }
  465. return -ENOENT;
  466. }
  467. /* fill CLC proposal msg with ipv6 prefixes from device */
  468. static int smc_clc_prfx_set6_rcu(struct net_device *dev,
  469. struct smc_clc_msg_proposal_prefix *prop,
  470. struct smc_clc_ipv6_prefix *ipv6_prfx)
  471. {
  472. #if IS_ENABLED(CONFIG_IPV6)
  473. struct inet6_dev *in6_dev = __in6_dev_get(dev);
  474. struct inet6_ifaddr *ifa;
  475. int cnt = 0;
  476. if (!in6_dev)
  477. return -ENODEV;
  478. /* use a maximum of 8 IPv6 prefixes from device */
  479. list_for_each_entry(ifa, &in6_dev->addr_list, if_list) {
  480. if (ipv6_addr_type(&ifa->addr) & IPV6_ADDR_LINKLOCAL)
  481. continue;
  482. ipv6_addr_prefix(&ipv6_prfx[cnt].prefix,
  483. &ifa->addr, ifa->prefix_len);
  484. ipv6_prfx[cnt].prefix_len = ifa->prefix_len;
  485. cnt++;
  486. if (cnt == SMC_CLC_MAX_V6_PREFIX)
  487. break;
  488. }
  489. prop->ipv6_prefixes_cnt = cnt;
  490. if (cnt)
  491. return 0;
  492. #endif
  493. return -ENOENT;
  494. }
  495. /* retrieve and set prefixes in CLC proposal msg */
  496. static int smc_clc_prfx_set(struct socket *clcsock,
  497. struct smc_clc_msg_proposal_prefix *prop,
  498. struct smc_clc_ipv6_prefix *ipv6_prfx)
  499. {
  500. struct sockaddr_storage addrs;
  501. struct sockaddr_in6 *addr6;
  502. struct sockaddr_in *addr;
  503. struct net_device *dev;
  504. struct dst_entry *dst;
  505. int rc = -ENOENT;
  506. /* get address to which the internal TCP socket is bound */
  507. if (kernel_getsockname(clcsock, (struct sockaddr *)&addrs) < 0)
  508. goto out;
  509. /* analyze IP specific data of net_device belonging to TCP socket */
  510. addr6 = (struct sockaddr_in6 *)&addrs;
  511. rcu_read_lock();
  512. dst = __sk_dst_get(clcsock->sk);
  513. dev = dst ? dst_dev_rcu(dst) : NULL;
  514. if (!dev) {
  515. rc = -ENODEV;
  516. goto out_unlock;
  517. }
  518. if (addrs.ss_family == PF_INET) {
  519. /* IPv4 */
  520. addr = (struct sockaddr_in *)&addrs;
  521. rc = smc_clc_prfx_set4_rcu(dev, addr->sin_addr.s_addr, prop);
  522. } else if (ipv6_addr_v4mapped(&addr6->sin6_addr)) {
  523. /* mapped IPv4 address - peer is IPv4 only */
  524. rc = smc_clc_prfx_set4_rcu(dev, addr6->sin6_addr.s6_addr32[3],
  525. prop);
  526. } else {
  527. /* IPv6 */
  528. rc = smc_clc_prfx_set6_rcu(dev, prop, ipv6_prfx);
  529. }
  530. out_unlock:
  531. rcu_read_unlock();
  532. out:
  533. return rc;
  534. }
  535. /* match ipv4 addrs of dev against addr in CLC proposal */
  536. static int smc_clc_prfx_match4_rcu(struct net_device *dev,
  537. struct smc_clc_msg_proposal_prefix *prop)
  538. {
  539. struct in_device *in_dev = __in_dev_get_rcu(dev);
  540. const struct in_ifaddr *ifa;
  541. if (!in_dev)
  542. return -ENODEV;
  543. in_dev_for_each_ifa_rcu(ifa, in_dev) {
  544. if (prop->prefix_len == inet_mask_len(ifa->ifa_mask) &&
  545. inet_ifa_match(prop->outgoing_subnet, ifa))
  546. return 0;
  547. }
  548. return -ENOENT;
  549. }
  550. /* match ipv6 addrs of dev against addrs in CLC proposal */
  551. static int smc_clc_prfx_match6_rcu(struct net_device *dev,
  552. struct smc_clc_msg_proposal_prefix *prop)
  553. {
  554. #if IS_ENABLED(CONFIG_IPV6)
  555. struct inet6_dev *in6_dev = __in6_dev_get(dev);
  556. struct smc_clc_ipv6_prefix *ipv6_prfx;
  557. struct inet6_ifaddr *ifa;
  558. int i, max;
  559. if (!in6_dev)
  560. return -ENODEV;
  561. /* ipv6 prefix list starts behind smc_clc_msg_proposal_prefix */
  562. ipv6_prfx = (struct smc_clc_ipv6_prefix *)((u8 *)prop + sizeof(*prop));
  563. max = min_t(u8, prop->ipv6_prefixes_cnt, SMC_CLC_MAX_V6_PREFIX);
  564. list_for_each_entry(ifa, &in6_dev->addr_list, if_list) {
  565. if (ipv6_addr_type(&ifa->addr) & IPV6_ADDR_LINKLOCAL)
  566. continue;
  567. for (i = 0; i < max; i++) {
  568. if (ifa->prefix_len == ipv6_prfx[i].prefix_len &&
  569. ipv6_prefix_equal(&ifa->addr, &ipv6_prfx[i].prefix,
  570. ifa->prefix_len))
  571. return 0;
  572. }
  573. }
  574. #endif
  575. return -ENOENT;
  576. }
  577. /* check if proposed prefixes match one of our device prefixes */
  578. int smc_clc_prfx_match(struct socket *clcsock,
  579. struct smc_clc_msg_proposal_prefix *prop)
  580. {
  581. struct net_device *dev;
  582. struct dst_entry *dst;
  583. int rc;
  584. rcu_read_lock();
  585. dst = __sk_dst_get(clcsock->sk);
  586. dev = dst ? dst_dev_rcu(dst) : NULL;
  587. if (!dev) {
  588. rc = -ENODEV;
  589. goto out;
  590. }
  591. if (!prop->ipv6_prefixes_cnt)
  592. rc = smc_clc_prfx_match4_rcu(dev, prop);
  593. else
  594. rc = smc_clc_prfx_match6_rcu(dev, prop);
  595. out:
  596. rcu_read_unlock();
  597. return rc;
  598. }
  599. /* Wait for data on the tcp-socket, analyze received data
  600. * Returns:
  601. * 0 if success and it was not a decline that we received.
  602. * SMC_CLC_DECL_REPLY if decline received for fallback w/o another decl send.
  603. * clcsock error, -EINTR, -ECONNRESET, -EPROTO otherwise.
  604. */
  605. int smc_clc_wait_msg(struct smc_sock *smc, void *buf, int buflen,
  606. u8 expected_type, unsigned long timeout)
  607. {
  608. long rcvtimeo = READ_ONCE(smc->clcsock->sk->sk_rcvtimeo);
  609. struct sock *clc_sk = smc->clcsock->sk;
  610. struct smc_clc_msg_hdr *clcm = buf;
  611. struct msghdr msg = {NULL, 0};
  612. int reason_code = 0;
  613. struct kvec vec = {buf, buflen};
  614. int len, datlen, recvlen;
  615. bool check_trl = true;
  616. int krflags;
  617. /* peek the first few bytes to determine length of data to receive
  618. * so we don't consume any subsequent CLC message or payload data
  619. * in the TCP byte stream
  620. */
  621. /*
  622. * Caller must make sure that buflen is no less than
  623. * sizeof(struct smc_clc_msg_hdr)
  624. */
  625. krflags = MSG_PEEK | MSG_WAITALL;
  626. WRITE_ONCE(clc_sk->sk_rcvtimeo, timeout);
  627. iov_iter_kvec(&msg.msg_iter, ITER_DEST, &vec, 1,
  628. sizeof(struct smc_clc_msg_hdr));
  629. len = sock_recvmsg(smc->clcsock, &msg, krflags);
  630. if (signal_pending(current)) {
  631. reason_code = -EINTR;
  632. clc_sk->sk_err = EINTR;
  633. smc->sk.sk_err = EINTR;
  634. goto out;
  635. }
  636. if (clc_sk->sk_err) {
  637. reason_code = -clc_sk->sk_err;
  638. if (clc_sk->sk_err == EAGAIN &&
  639. expected_type == SMC_CLC_DECLINE)
  640. clc_sk->sk_err = 0; /* reset for fallback usage */
  641. else
  642. smc->sk.sk_err = clc_sk->sk_err;
  643. goto out;
  644. }
  645. if (!len) { /* peer has performed orderly shutdown */
  646. smc->sk.sk_err = ECONNRESET;
  647. reason_code = -ECONNRESET;
  648. goto out;
  649. }
  650. if (len < 0) {
  651. if (len != -EAGAIN || expected_type != SMC_CLC_DECLINE)
  652. smc->sk.sk_err = -len;
  653. reason_code = len;
  654. goto out;
  655. }
  656. datlen = ntohs(clcm->length);
  657. if ((len < sizeof(struct smc_clc_msg_hdr)) ||
  658. (clcm->version < SMC_V1) ||
  659. ((clcm->type != SMC_CLC_DECLINE) &&
  660. (clcm->type != expected_type))) {
  661. smc->sk.sk_err = EPROTO;
  662. reason_code = -EPROTO;
  663. goto out;
  664. }
  665. /* receive the complete CLC message */
  666. memset(&msg, 0, sizeof(struct msghdr));
  667. if (datlen > buflen) {
  668. check_trl = false;
  669. recvlen = buflen;
  670. } else {
  671. recvlen = datlen;
  672. }
  673. iov_iter_kvec(&msg.msg_iter, ITER_DEST, &vec, 1, recvlen);
  674. krflags = MSG_WAITALL;
  675. len = sock_recvmsg(smc->clcsock, &msg, krflags);
  676. if (len < recvlen || !smc_clc_msg_hdr_valid(clcm, check_trl)) {
  677. smc->sk.sk_err = EPROTO;
  678. reason_code = -EPROTO;
  679. goto out;
  680. }
  681. datlen -= len;
  682. while (datlen) {
  683. u8 tmp[SMC_CLC_RECV_BUF_LEN];
  684. vec.iov_base = &tmp;
  685. vec.iov_len = SMC_CLC_RECV_BUF_LEN;
  686. /* receive remaining proposal message */
  687. recvlen = datlen > SMC_CLC_RECV_BUF_LEN ?
  688. SMC_CLC_RECV_BUF_LEN : datlen;
  689. iov_iter_kvec(&msg.msg_iter, ITER_DEST, &vec, 1, recvlen);
  690. len = sock_recvmsg(smc->clcsock, &msg, krflags);
  691. if (len < recvlen) {
  692. smc->sk.sk_err = EPROTO;
  693. reason_code = -EPROTO;
  694. goto out;
  695. }
  696. datlen -= len;
  697. }
  698. if (clcm->type == SMC_CLC_DECLINE) {
  699. struct smc_clc_msg_decline *dclc;
  700. dclc = (struct smc_clc_msg_decline *)clcm;
  701. reason_code = SMC_CLC_DECL_PEERDECL;
  702. smc->peer_diagnosis = ntohl(dclc->peer_diagnosis);
  703. if (((struct smc_clc_msg_decline *)buf)->hdr.typev2 &
  704. SMC_FIRST_CONTACT_MASK) {
  705. smc->conn.lgr->sync_err = 1;
  706. smc_lgr_terminate_sched(smc->conn.lgr);
  707. }
  708. }
  709. out:
  710. WRITE_ONCE(clc_sk->sk_rcvtimeo, rcvtimeo);
  711. return reason_code;
  712. }
  713. /* send CLC DECLINE message across internal TCP socket */
  714. int smc_clc_send_decline(struct smc_sock *smc, u32 peer_diag_info, u8 version)
  715. {
  716. struct smc_clc_msg_decline *dclc_v1;
  717. struct smc_clc_msg_decline_v2 dclc;
  718. struct msghdr msg;
  719. int len, send_len;
  720. struct kvec vec;
  721. dclc_v1 = (struct smc_clc_msg_decline *)&dclc;
  722. memset(&dclc, 0, sizeof(dclc));
  723. memcpy(dclc.hdr.eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER));
  724. dclc.hdr.type = SMC_CLC_DECLINE;
  725. dclc.hdr.version = version;
  726. dclc.os_type = version == SMC_V1 ? 0 : SMC_CLC_OS_LINUX;
  727. dclc.hdr.typev2 = (peer_diag_info == SMC_CLC_DECL_SYNCERR) ?
  728. SMC_FIRST_CONTACT_MASK : 0;
  729. if ((!smc_conn_lgr_valid(&smc->conn) || !smc->conn.lgr->is_smcd) &&
  730. smc_ib_is_valid_local_systemid())
  731. memcpy(dclc.id_for_peer, local_systemid,
  732. sizeof(local_systemid));
  733. dclc.peer_diagnosis = htonl(peer_diag_info);
  734. if (version == SMC_V1) {
  735. memcpy(dclc_v1->trl.eyecatcher, SMC_EYECATCHER,
  736. sizeof(SMC_EYECATCHER));
  737. send_len = sizeof(*dclc_v1);
  738. } else {
  739. memcpy(dclc.trl.eyecatcher, SMC_EYECATCHER,
  740. sizeof(SMC_EYECATCHER));
  741. send_len = sizeof(dclc);
  742. }
  743. dclc.hdr.length = htons(send_len);
  744. memset(&msg, 0, sizeof(msg));
  745. vec.iov_base = &dclc;
  746. vec.iov_len = send_len;
  747. len = kernel_sendmsg(smc->clcsock, &msg, &vec, 1, send_len);
  748. if (len < 0 || len < send_len)
  749. len = -EPROTO;
  750. return len > 0 ? 0 : len;
  751. }
/* send CLC PROPOSAL message across internal TCP socket
 *
 * Builds the proposal in a heap-allocated, zeroed smc_clc_msg_proposal_area
 * and sends the parts that apply to the offered SMC types as one scattered
 * kernel_sendmsg() on smc->clcsock.
 *
 * @smc: SMC socket; its clcsock carries the message, its sk.sk_err is set
 *       when sending fails or is short
 * @ini: offered SMC types and devices; ini->smc_type_v1 is reset to
 *       SMC_TYPE_N here when the IP prefix cannot be determined but a v2
 *       type is still offered
 *
 * Returns 0 when the complete message was sent, -ENOMEM when the message
 * area cannot be allocated, SMC_CLC_DECL_CNFERR when the prefix lookup
 * fails and no v2 type is offered, the negated clcsock sk_err when
 * kernel_sendmsg() fails, or -ENETUNREACH when fewer bytes than the
 * message length were sent.
 */
int smc_clc_send_proposal(struct smc_sock *smc, struct smc_init_info *ini)
{
	struct smc_clc_smcd_v2_extension *smcd_v2_ext;
	struct smc_clc_msg_proposal_prefix *pclc_prfx;
	struct smc_clc_msg_proposal *pclc_base;
	struct smc_clc_smcd_gid_chid *gidchids;
	struct smc_clc_msg_proposal_area *pclc;
	struct smc_clc_ipv6_prefix *ipv6_prfx;
	struct net *net = sock_net(&smc->sk);
	struct smc_clc_v2_extension *v2_ext;
	struct smc_clc_msg_smcd *pclc_smcd;
	struct smc_clc_msg_trail *trl;
	struct smcd_dev *smcd;
	int len, i, plen, rc;
	int reason_code = 0;
	/* at most 8 segments: base, smcd, prefix, ipv6 prefixes, v2 ext,
	 * smcd v2 ext, gid/chid list, trailer
	 */
	struct kvec vec[8];
	struct msghdr msg;

	pclc = kzalloc_obj(*pclc);
	if (!pclc)
		return -ENOMEM;

	/* set up pointers to the individual parts inside the message area */
	pclc_base = &pclc->pclc_base;
	pclc_smcd = &pclc->pclc_smcd;
	pclc_prfx = &pclc->pclc_prfx;
	ipv6_prfx = pclc->pclc_prfx_ipv6;
	/* the area embeds the 'fixed' member of each extension struct;
	 * container_of() converts that to a pointer of the full struct type
	 */
	v2_ext = container_of(&pclc->pclc_v2_ext,
			      struct smc_clc_v2_extension, fixed);
	smcd_v2_ext = container_of(&pclc->pclc_smcd_v2_ext,
				   struct smc_clc_smcd_v2_extension, fixed);
	gidchids = pclc->pclc_gidchids;
	trl = &pclc->pclc_trl;

	pclc_base->hdr.version = SMC_V2;
	pclc_base->hdr.typev1 = ini->smc_type_v1;
	pclc_base->hdr.typev2 = ini->smc_type_v2;
	/* parts that are always sent; optional parts are added to plen below */
	plen = sizeof(*pclc_base) + sizeof(*pclc_smcd) + sizeof(*trl);

	/* retrieve ip prefixes for CLC proposal msg */
	if (ini->smc_type_v1 != SMC_TYPE_N) {
		rc = smc_clc_prfx_set(smc->clcsock, pclc_prfx, ipv6_prfx);
		if (rc) {
			/* no prefix and nothing else to offer: give up */
			if (ini->smc_type_v2 == SMC_TYPE_N) {
				kfree(pclc);
				return SMC_CLC_DECL_CNFERR;
			}
			/* withdraw the v1 offer, continue with v2 only */
			pclc_base->hdr.typev1 = SMC_TYPE_N;
			ini->smc_type_v1 = SMC_TYPE_N;
		} else {
			pclc_base->iparea_offset = htons(sizeof(*pclc_smcd));
			plen += sizeof(*pclc_prfx) +
					pclc_prfx->ipv6_prefixes_cnt *
					sizeof(ipv6_prfx[0]);
		}
	}

	/* build SMC Proposal CLC message */
	memcpy(pclc_base->hdr.eyecatcher, SMC_EYECATCHER,
	       sizeof(SMC_EYECATCHER));
	pclc_base->hdr.type = SMC_CLC_PROPOSAL;
	if (smcr_indicated(ini->smc_type_v1)) {
		/* add SMC-R specifics */
		memcpy(pclc_base->lcl.id_for_peer, local_systemid,
		       sizeof(local_systemid));
		memcpy(pclc_base->lcl.gid, ini->ib_gid, SMC_GID_SIZE);
		/* ib_port is used 1-based here, mac[] is indexed from 0 */
		memcpy(pclc_base->lcl.mac, &ini->ib_dev->mac[ini->ib_port - 1],
		       ETH_ALEN);
	}
	if (smcd_indicated(ini->smc_type_v1)) {
		struct smcd_gid smcd_gid;

		/* add SMC-D specifics */
		/* slot 0 of ism_dev[] holds the device offered for v1 */
		if (ini->ism_dev[0]) {
			smcd = ini->ism_dev[0];
			copy_to_smcdgid(&smcd_gid, &smcd->dibs->gid);
			pclc_smcd->ism.gid = htonll(smcd_gid.gid);
			pclc_smcd->ism.chid =
				htons(smc_ism_get_chid(ini->ism_dev[0]));
		}
	}
	if (ini->smc_type_v2 == SMC_TYPE_N) {
		pclc_smcd->v2_ext_offset = 0;
	} else {
		struct smc_clc_eid_entry *ueident;
		u16 v2_ext_offset;

		v2_ext->hdr.flag.release = SMC_RELEASE;
		/* offset is counted from the end of the v2_ext_offset field:
		 * the rest of the SMC-D area plus, if sent, the prefix area
		 */
		v2_ext_offset = sizeof(*pclc_smcd) -
			offsetofend(struct smc_clc_msg_smcd, v2_ext_offset);
		if (ini->smc_type_v1 != SMC_TYPE_N)
			v2_ext_offset += sizeof(*pclc_prfx) +
						pclc_prfx->ipv6_prefixes_cnt *
						sizeof(ipv6_prfx[0]);
		pclc_smcd->v2_ext_offset = htons(v2_ext_offset);
		plen += sizeof(*v2_ext);

		v2_ext->feature_mask = htons(SMC_FEATURE_MASK);
		/* copy all user EIDs while holding the table's read lock so
		 * that eid_cnt, plen and the copied entries stay consistent
		 */
		read_lock(&smc_clc_eid_table.lock);
		v2_ext->hdr.eid_cnt = smc_clc_eid_table.ueid_cnt;
		plen += smc_clc_eid_table.ueid_cnt * SMC_MAX_EID_LEN;
		i = 0;
		list_for_each_entry(ueident, &smc_clc_eid_table.list, list) {
			memcpy(v2_ext->user_eids[i++], ueident->eid,
			       sizeof(ueident->eid));
		}
		read_unlock(&smc_clc_eid_table.lock);
	}
	if (smcd_indicated(ini->smc_type_v2)) {
		struct smcd_gid smcd_gid;
		u8 *eid = NULL;
		int entry = 0;

		v2_ext->hdr.flag.seid = smc_clc_eid_table.seid_enabled;
		/* offset from the end of the smcd_v2_ext_offset field to the
		 * SMC-D v2 extension, which follows the user EID list
		 */
		v2_ext->hdr.smcd_v2_ext_offset = htons(sizeof(*v2_ext) -
				offsetofend(struct smc_clnt_opts_area_hdr,
					    smcd_v2_ext_offset) +
				v2_ext->hdr.eid_cnt * SMC_MAX_EID_LEN);
		smc_ism_get_system_eid(&eid);
		if (eid && v2_ext->hdr.flag.seid)
			memcpy(smcd_v2_ext->system_eid, eid, SMC_MAX_EID_LEN);
		plen += sizeof(*smcd_v2_ext);
		if (ini->ism_offered_cnt) {
			/* v2 devices are taken from ism_dev[1..ism_offered_cnt] */
			for (i = 1; i <= ini->ism_offered_cnt; i++) {
				smcd = ini->ism_dev[i];
				copy_to_smcdgid(&smcd_gid, &smcd->dibs->gid);
				gidchids[entry].chid =
					htons(smc_ism_get_chid(ini->ism_dev[i]));
				gidchids[entry].gid = htonll(smcd_gid.gid);
				if (smc_ism_is_emulated(smcd)) {
					/* an Emulated-ISM device takes two
					 * entries. CHID of the second entry
					 * repeats that of the first entry.
					 */
					gidchids[entry + 1].chid =
						gidchids[entry].chid;
					gidchids[entry + 1].gid =
						htonll(smcd_gid.gid_ext);
					entry++;
				}
				entry++;
			}
			plen += entry * sizeof(struct smc_clc_smcd_gid_chid);
		}
		/* number of list entries used, not number of devices */
		v2_ext->hdr.ism_gid_cnt = entry;
	}
	if (smcr_indicated(ini->smc_type_v2)) {
		memcpy(v2_ext->roce, ini->smcrv2.ib_gid_v2, SMC_GID_SIZE);
		v2_ext->max_conns = net->smc.sysctl_max_conns_per_lgr;
		v2_ext->max_links = net->smc.sysctl_max_links_per_lgr;
	}

	pclc_base->hdr.length = htons(plen);
	memcpy(trl->eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER));

	/* send SMC Proposal CLC message */
	/* the segments below must add up to plen and follow the same
	 * conditions that were used to accumulate plen above
	 */
	memset(&msg, 0, sizeof(msg));
	i = 0;
	vec[i].iov_base = pclc_base;
	vec[i++].iov_len = sizeof(*pclc_base);
	vec[i].iov_base = pclc_smcd;
	vec[i++].iov_len = sizeof(*pclc_smcd);
	if (ini->smc_type_v1 != SMC_TYPE_N) {
		vec[i].iov_base = pclc_prfx;
		vec[i++].iov_len = sizeof(*pclc_prfx);
		if (pclc_prfx->ipv6_prefixes_cnt > 0) {
			vec[i].iov_base = ipv6_prfx;
			vec[i++].iov_len = pclc_prfx->ipv6_prefixes_cnt *
					   sizeof(ipv6_prfx[0]);
		}
	}
	if (ini->smc_type_v2 != SMC_TYPE_N) {
		vec[i].iov_base = v2_ext;
		vec[i++].iov_len = sizeof(*v2_ext) +
				   (v2_ext->hdr.eid_cnt * SMC_MAX_EID_LEN);
		if (smcd_indicated(ini->smc_type_v2)) {
			vec[i].iov_base = smcd_v2_ext;
			vec[i++].iov_len = sizeof(*smcd_v2_ext);
			if (ini->ism_offered_cnt) {
				vec[i].iov_base = gidchids;
				vec[i++].iov_len = v2_ext->hdr.ism_gid_cnt *
					sizeof(struct smc_clc_smcd_gid_chid);
			}
		}
	}
	vec[i].iov_base = trl;
	vec[i++].iov_len = sizeof(*trl);
	/* due to the few bytes needed for clc-handshake this cannot block */
	len = kernel_sendmsg(smc->clcsock, &msg, vec, i, plen);
	if (len < 0) {
		/* propagate the error recorded on the internal TCP socket */
		smc->sk.sk_err = smc->clcsock->sk->sk_err;
		reason_code = -smc->sk.sk_err;
	} else if (len < ntohs(pclc_base->hdr.length)) {
		/* short send: message is incomplete on the wire */
		reason_code = -ENETUNREACH;
		smc->sk.sk_err = -reason_code;
	}
	kfree(pclc);
	return reason_code;
}
  940. static void
  941. smcd_clc_prep_confirm_accept(struct smc_connection *conn,
  942. struct smc_clc_msg_accept_confirm *clc,
  943. int first_contact, u8 version,
  944. u8 *eid, struct smc_init_info *ini,
  945. int *fce_len,
  946. struct smc_clc_first_contact_ext_v2x *fce_v2x,
  947. struct smc_clc_msg_trail *trl)
  948. {
  949. struct smcd_dev *smcd = conn->lgr->smcd;
  950. struct smcd_gid smcd_gid;
  951. u16 chid;
  952. int len;
  953. /* SMC-D specific settings */
  954. memcpy(clc->hdr.eyecatcher, SMCD_EYECATCHER,
  955. sizeof(SMCD_EYECATCHER));
  956. copy_to_smcdgid(&smcd_gid, &smcd->dibs->gid);
  957. clc->hdr.typev1 = SMC_TYPE_D;
  958. clc->d0.gid = htonll(smcd_gid.gid);
  959. clc->d0.token = htonll(conn->rmb_desc->token);
  960. clc->d0.dmbe_size = conn->rmbe_size_comp;
  961. clc->d0.dmbe_idx = 0;
  962. memcpy(&clc->d0.linkid, conn->lgr->id, SMC_LGR_ID_SIZE);
  963. if (version == SMC_V1) {
  964. clc->hdr.length = htons(SMCD_CLC_ACCEPT_CONFIRM_LEN);
  965. } else {
  966. chid = smc_ism_get_chid(smcd);
  967. clc->d1.chid = htons(chid);
  968. if (eid && eid[0])
  969. memcpy(clc->d1.eid, eid, SMC_MAX_EID_LEN);
  970. if (__smc_ism_is_emulated(chid))
  971. clc->d1.gid_ext = htonll(smcd_gid.gid_ext);
  972. len = SMCD_CLC_ACCEPT_CONFIRM_LEN_V2;
  973. if (first_contact) {
  974. *fce_len = smc_clc_fill_fce_v2x(fce_v2x, ini);
  975. len += *fce_len;
  976. }
  977. clc->hdr.length = htons(len);
  978. }
  979. memcpy(trl->eyecatcher, SMCD_EYECATCHER,
  980. sizeof(SMCD_EYECATCHER));
  981. }
  982. static void
  983. smcr_clc_prep_confirm_accept(struct smc_connection *conn,
  984. struct smc_clc_msg_accept_confirm *clc,
  985. int first_contact, u8 version,
  986. u8 *eid, struct smc_init_info *ini,
  987. int *fce_len,
  988. struct smc_clc_first_contact_ext_v2x *fce_v2x,
  989. struct smc_clc_fce_gid_ext *gle,
  990. struct smc_clc_msg_trail *trl)
  991. {
  992. struct smc_link *link = conn->lnk;
  993. int len;
  994. /* SMC-R specific settings */
  995. memcpy(clc->hdr.eyecatcher, SMC_EYECATCHER,
  996. sizeof(SMC_EYECATCHER));
  997. clc->hdr.typev1 = SMC_TYPE_R;
  998. memcpy(clc->r0.lcl.id_for_peer, local_systemid,
  999. sizeof(local_systemid));
  1000. memcpy(&clc->r0.lcl.gid, link->gid, SMC_GID_SIZE);
  1001. memcpy(&clc->r0.lcl.mac, &link->smcibdev->mac[link->ibport - 1],
  1002. ETH_ALEN);
  1003. hton24(clc->r0.qpn, link->roce_qp->qp_num);
  1004. clc->r0.rmb_rkey =
  1005. htonl(conn->rmb_desc->mr[link->link_idx]->rkey);
  1006. clc->r0.rmbe_idx = 1; /* for now: 1 RMB = 1 RMBE */
  1007. clc->r0.rmbe_alert_token = htonl(conn->alert_token_local);
  1008. switch (clc->hdr.type) {
  1009. case SMC_CLC_ACCEPT:
  1010. clc->r0.qp_mtu = link->path_mtu;
  1011. break;
  1012. case SMC_CLC_CONFIRM:
  1013. clc->r0.qp_mtu = min(link->path_mtu, link->peer_mtu);
  1014. break;
  1015. }
  1016. clc->r0.rmbe_size = conn->rmbe_size_comp;
  1017. clc->r0.rmb_dma_addr = conn->rmb_desc->is_vm ?
  1018. cpu_to_be64((uintptr_t)conn->rmb_desc->cpu_addr) :
  1019. cpu_to_be64((u64)sg_dma_address
  1020. (conn->rmb_desc->sgt[link->link_idx].sgl));
  1021. hton24(clc->r0.psn, link->psn_initial);
  1022. if (version == SMC_V1) {
  1023. clc->hdr.length = htons(SMCR_CLC_ACCEPT_CONFIRM_LEN);
  1024. } else {
  1025. if (eid && eid[0])
  1026. memcpy(clc->r1.eid, eid, SMC_MAX_EID_LEN);
  1027. len = SMCR_CLC_ACCEPT_CONFIRM_LEN_V2;
  1028. if (first_contact) {
  1029. *fce_len = smc_clc_fill_fce_v2x(fce_v2x, ini);
  1030. len += *fce_len;
  1031. fce_v2x->fce_v2_base.v2_direct =
  1032. !link->lgr->uses_gateway;
  1033. if (clc->hdr.type == SMC_CLC_CONFIRM) {
  1034. memset(gle, 0, sizeof(*gle));
  1035. gle->gid_cnt = ini->smcrv2.gidlist.len;
  1036. len += sizeof(*gle);
  1037. len += gle->gid_cnt * sizeof(gle->gid[0]);
  1038. }
  1039. }
  1040. clc->hdr.length = htons(len);
  1041. }
  1042. memcpy(trl->eyecatcher, SMC_EYECATCHER, sizeof(SMC_EYECATCHER));
  1043. }
  1044. /* build and send CLC CONFIRM / ACCEPT message */
  1045. static int smc_clc_send_confirm_accept(struct smc_sock *smc,
  1046. struct smc_clc_msg_accept_confirm *clc,
  1047. int first_contact, u8 version,
  1048. u8 *eid, struct smc_init_info *ini)
  1049. {
  1050. struct smc_clc_first_contact_ext_v2x fce_v2x;
  1051. struct smc_connection *conn = &smc->conn;
  1052. struct smc_clc_fce_gid_ext gle;
  1053. struct smc_clc_msg_trail trl;
  1054. int i, fce_len;
  1055. struct kvec vec[5];
  1056. struct msghdr msg;
  1057. /* send SMC Confirm CLC msg */
  1058. clc->hdr.version = version; /* SMC version */
  1059. if (first_contact)
  1060. clc->hdr.typev2 |= SMC_FIRST_CONTACT_MASK;
  1061. if (conn->lgr->is_smcd)
  1062. smcd_clc_prep_confirm_accept(conn, clc, first_contact,
  1063. version, eid, ini, &fce_len,
  1064. &fce_v2x, &trl);
  1065. else
  1066. smcr_clc_prep_confirm_accept(conn, clc, first_contact,
  1067. version, eid, ini, &fce_len,
  1068. &fce_v2x, &gle, &trl);
  1069. memset(&msg, 0, sizeof(msg));
  1070. i = 0;
  1071. vec[i].iov_base = clc;
  1072. if (version > SMC_V1)
  1073. vec[i++].iov_len = (clc->hdr.typev1 == SMC_TYPE_D ?
  1074. SMCD_CLC_ACCEPT_CONFIRM_LEN_V2 :
  1075. SMCR_CLC_ACCEPT_CONFIRM_LEN_V2) -
  1076. sizeof(trl);
  1077. else
  1078. vec[i++].iov_len = (clc->hdr.typev1 == SMC_TYPE_D ?
  1079. SMCD_CLC_ACCEPT_CONFIRM_LEN :
  1080. SMCR_CLC_ACCEPT_CONFIRM_LEN) -
  1081. sizeof(trl);
  1082. if (version > SMC_V1 && first_contact) {
  1083. vec[i].iov_base = &fce_v2x;
  1084. vec[i++].iov_len = fce_len;
  1085. if (!conn->lgr->is_smcd) {
  1086. if (clc->hdr.type == SMC_CLC_CONFIRM) {
  1087. vec[i].iov_base = &gle;
  1088. vec[i++].iov_len = sizeof(gle);
  1089. vec[i].iov_base = &ini->smcrv2.gidlist.list;
  1090. vec[i++].iov_len = gle.gid_cnt *
  1091. sizeof(gle.gid[0]);
  1092. }
  1093. }
  1094. }
  1095. vec[i].iov_base = &trl;
  1096. vec[i++].iov_len = sizeof(trl);
  1097. return kernel_sendmsg(smc->clcsock, &msg, vec, 1,
  1098. ntohs(clc->hdr.length));
  1099. }
  1100. /* send CLC CONFIRM message across internal TCP socket */
  1101. int smc_clc_send_confirm(struct smc_sock *smc, bool clnt_first_contact,
  1102. u8 version, u8 *eid, struct smc_init_info *ini)
  1103. {
  1104. struct smc_clc_msg_accept_confirm cclc;
  1105. int reason_code = 0;
  1106. int len;
  1107. /* send SMC Confirm CLC msg */
  1108. memset(&cclc, 0, sizeof(cclc));
  1109. cclc.hdr.type = SMC_CLC_CONFIRM;
  1110. len = smc_clc_send_confirm_accept(smc, &cclc, clnt_first_contact,
  1111. version, eid, ini);
  1112. if (len < ntohs(cclc.hdr.length)) {
  1113. if (len >= 0) {
  1114. reason_code = -ENETUNREACH;
  1115. smc->sk.sk_err = -reason_code;
  1116. } else {
  1117. smc->sk.sk_err = smc->clcsock->sk->sk_err;
  1118. reason_code = -smc->sk.sk_err;
  1119. }
  1120. }
  1121. return reason_code;
  1122. }
  1123. /* send CLC ACCEPT message across internal TCP socket */
  1124. int smc_clc_send_accept(struct smc_sock *new_smc, bool srv_first_contact,
  1125. u8 version, u8 *negotiated_eid, struct smc_init_info *ini)
  1126. {
  1127. struct smc_clc_msg_accept_confirm aclc;
  1128. int len;
  1129. memset(&aclc, 0, sizeof(aclc));
  1130. aclc.hdr.type = SMC_CLC_ACCEPT;
  1131. len = smc_clc_send_confirm_accept(new_smc, &aclc, srv_first_contact,
  1132. version, negotiated_eid, ini);
  1133. if (len < ntohs(aclc.hdr.length))
  1134. len = len >= 0 ? -EPROTO : -new_smc->clcsock->sk->sk_err;
  1135. return len > 0 ? 0 : len;
  1136. }
  1137. int smc_clc_srv_v2x_features_validate(struct smc_sock *smc,
  1138. struct smc_clc_msg_proposal *pclc,
  1139. struct smc_init_info *ini)
  1140. {
  1141. struct smc_clc_v2_extension *pclc_v2_ext;
  1142. struct net *net = sock_net(&smc->sk);
  1143. ini->max_conns = SMC_CONN_PER_LGR_MAX;
  1144. ini->max_links = SMC_LINKS_ADD_LNK_MAX;
  1145. ini->feature_mask = SMC_FEATURE_MASK;
  1146. if ((!(ini->smcd_version & SMC_V2) && !(ini->smcr_version & SMC_V2)) ||
  1147. ini->release_nr < SMC_RELEASE_1)
  1148. return 0;
  1149. pclc_v2_ext = smc_get_clc_v2_ext(pclc);
  1150. if (!pclc_v2_ext)
  1151. return SMC_CLC_DECL_NOV2EXT;
  1152. if (ini->smcr_version & SMC_V2) {
  1153. ini->max_conns = min_t(u8, pclc_v2_ext->max_conns,
  1154. net->smc.sysctl_max_conns_per_lgr);
  1155. if (ini->max_conns < SMC_CONN_PER_LGR_MIN)
  1156. return SMC_CLC_DECL_MAXCONNERR;
  1157. ini->max_links = min_t(u8, pclc_v2_ext->max_links,
  1158. net->smc.sysctl_max_links_per_lgr);
  1159. if (ini->max_links < SMC_LINKS_ADD_LNK_MIN)
  1160. return SMC_CLC_DECL_MAXLINKERR;
  1161. }
  1162. return 0;
  1163. }
  1164. int smc_clc_clnt_v2x_features_validate(struct smc_clc_first_contact_ext *fce,
  1165. struct smc_init_info *ini)
  1166. {
  1167. struct smc_clc_first_contact_ext_v2x *fce_v2x =
  1168. (struct smc_clc_first_contact_ext_v2x *)fce;
  1169. if (ini->release_nr < SMC_RELEASE_1)
  1170. return 0;
  1171. if (!ini->is_smcd) {
  1172. if (fce_v2x->max_conns < SMC_CONN_PER_LGR_MIN)
  1173. return SMC_CLC_DECL_MAXCONNERR;
  1174. ini->max_conns = fce_v2x->max_conns;
  1175. if (fce_v2x->max_links > SMC_LINKS_ADD_LNK_MAX ||
  1176. fce_v2x->max_links < SMC_LINKS_ADD_LNK_MIN)
  1177. return SMC_CLC_DECL_MAXLINKERR;
  1178. ini->max_links = fce_v2x->max_links;
  1179. }
  1180. /* common supplemental features of server and client */
  1181. ini->feature_mask = ntohs(fce_v2x->feature_mask) & SMC_FEATURE_MASK;
  1182. return 0;
  1183. }
  1184. int smc_clc_v2x_features_confirm_check(struct smc_clc_msg_accept_confirm *cclc,
  1185. struct smc_init_info *ini)
  1186. {
  1187. struct smc_clc_first_contact_ext *fce =
  1188. smc_get_clc_first_contact_ext(cclc, ini->is_smcd);
  1189. struct smc_clc_first_contact_ext_v2x *fce_v2x =
  1190. (struct smc_clc_first_contact_ext_v2x *)fce;
  1191. if (cclc->hdr.version == SMC_V1 ||
  1192. !(cclc->hdr.typev2 & SMC_FIRST_CONTACT_MASK))
  1193. return 0;
  1194. if (ini->release_nr != fce->release)
  1195. return SMC_CLC_DECL_RELEASEERR;
  1196. if (fce->release < SMC_RELEASE_1)
  1197. return 0;
  1198. if (!ini->is_smcd) {
  1199. if (fce_v2x->max_conns != ini->max_conns)
  1200. return SMC_CLC_DECL_MAXCONNERR;
  1201. if (fce_v2x->max_links != ini->max_links)
  1202. return SMC_CLC_DECL_MAXLINKERR;
  1203. }
  1204. /* common supplemental features returned by client */
  1205. ini->feature_mask = ntohs(fce_v2x->feature_mask);
  1206. return 0;
  1207. }
  1208. void smc_clc_get_hostname(u8 **host)
  1209. {
  1210. *host = &smc_hostname[0];
  1211. }
  1212. void __init smc_clc_init(void)
  1213. {
  1214. struct new_utsname *u;
  1215. memset(smc_hostname, _S, sizeof(smc_hostname)); /* ASCII blanks */
  1216. u = utsname();
  1217. memcpy(smc_hostname, u->nodename,
  1218. min_t(size_t, strlen(u->nodename), sizeof(smc_hostname)));
  1219. INIT_LIST_HEAD(&smc_clc_eid_table.list);
  1220. rwlock_init(&smc_clc_eid_table.lock);
  1221. smc_clc_eid_table.ueid_cnt = 0;
  1222. #if IS_ENABLED(CONFIG_S390)
  1223. smc_clc_eid_table.seid_enabled = 1;
  1224. #else
  1225. smc_clc_eid_table.seid_enabled = 0;
  1226. #endif
  1227. }
/* teardown counterpart of smc_clc_init() */
void smc_clc_exit(void)
{
	/* NOTE(review): a NULL argument presumably removes all user EIDs
	 * from smc_clc_eid_table - confirm against smc_clc_ueid_remove()
	 */
	smc_clc_ueid_remove(NULL);
}