target_core_user.c 86 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466246724682469247024712472247324742475247624772478247924802481248224832484248524862487248824892490249124922493249424952496249724982499250025012502250325042505250625072508250925102511251225132514251525162517251825192520252125222523252425252526252725282529253025312532253325342535253625372538253925402541254225432544254525462547254825492550255125522553255425552556255725582559256025612562256325642565256625672568256925702571257225732574257525762577257825792580258125822583258425852586258725882589259025912592259325942595259625972598259926002601260226032604260526062607260826092610261126122613261426152616261726182619262026212622262326242625262626272628262926302631263226332634263526362637263826392640264126422643264426452646264726482649265026512652265326542655265626572658265926602661266226632664266526662667266826692670267126722673267426752676267726782679268026812682268326842685268626872688268926902691269226932694269526962697269826992700270127022703270427052706270727082709271027112712271327142715271627172718271927202721272227232724272527262727272827292730273127322733273427352736273727382739274027412742274327442745274627472748274927502751275227532754275527562757275827592760276127622763276427652766276727682769277027712772277327742775277627772778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327732783279328032813282328332843285328632873288328932903291329232933294329532963297329832993300330133023303330433053306330733083309331033113312331333143315331633173318331933203321332233233324332533263327332833293330333133323333333433353336333733383339334033413342334333443345334633473348334933503351335233533354335533563357335833593360336133623363336433653366336733683369337033713372337333743375337633773378337933803381338233833384338533863387338833893390339133923393
  1. // SPDX-License-Identifier: GPL-2.0-only
  2. /*
  3. * Copyright (C) 2013 Shaohua Li <shli@kernel.org>
  4. * Copyright (C) 2014 Red Hat, Inc.
  5. * Copyright (C) 2015 Arrikto, Inc.
  6. * Copyright (C) 2017 Chinamobile, Inc.
  7. */
  8. #include <linux/spinlock.h>
  9. #include <linux/module.h>
  10. #include <linux/kernel.h>
  11. #include <linux/timer.h>
  12. #include <linux/parser.h>
  13. #include <linux/vmalloc.h>
  14. #include <linux/uio_driver.h>
  15. #include <linux/xarray.h>
  16. #include <linux/stringify.h>
  17. #include <linux/bitops.h>
  18. #include <linux/highmem.h>
  19. #include <linux/configfs.h>
  20. #include <linux/mutex.h>
  21. #include <linux/workqueue.h>
  22. #include <linux/pagemap.h>
  23. #include <net/genetlink.h>
  24. #include <scsi/scsi_common.h>
  25. #include <scsi/scsi_proto.h>
  26. #include <target/target_core_base.h>
  27. #include <target/target_core_fabric.h>
  28. #include <target/target_core_backend.h>
  29. #include <linux/target_core_user.h>
  30. /**
  31. * DOC: Userspace I/O
  32. * Userspace I/O
  33. * -------------
  34. *
  35. * Define a shared-memory interface for LIO to pass SCSI commands and
  36. * data to userspace for processing. This is to allow backends that
  37. * are too complex for in-kernel support to be possible.
  38. *
  39. * It uses the UIO framework to do a lot of the device-creation and
  40. * introspection work for us.
  41. *
  42. * See the .h file for how the ring is laid out. Note that while the
  43. * command ring is defined, the particulars of the data area are
  44. * not. Offset values in the command entry point to other locations
  45. * internal to the mmap-ed area. There is separate space outside the
  46. * command ring for data buffers. This leaves maximum flexibility for
  47. * moving buffer allocations, or even page flipping or other
  48. * allocation techniques, without altering the command ring layout.
  49. *
  50. * SECURITY:
  51. * The user process must be assumed to be malicious. There's no way to
  52. * prevent it breaking the command ring protocol if it wants, but in
  53. * order to prevent other issues we must only ever read *data* from
  54. * the shared memory area, not offsets or sizes. This applies to
  55. * command ring entries as well as the mailbox. Extra code needed for
  56. * this may have a 'UAM' comment.
  57. */
  58. #define TCMU_TIME_OUT (30 * MSEC_PER_SEC)
  59. /* For mailbox plus cmd ring, the size is fixed 8MB */
  60. #define MB_CMDR_SIZE_DEF (8 * 1024 * 1024)
  61. /* Offset of cmd ring is size of mailbox */
  62. #define CMDR_OFF ((__u32)sizeof(struct tcmu_mailbox))
  63. #define CMDR_SIZE_DEF (MB_CMDR_SIZE_DEF - CMDR_OFF)
  64. /*
  65. * For data area, the default block size is PAGE_SIZE and
  66. * the default total size is 256K * PAGE_SIZE.
  67. */
  68. #define DATA_PAGES_PER_BLK_DEF 1
  69. #define DATA_AREA_PAGES_DEF (256 * 1024)
  70. #define TCMU_MBS_TO_PAGES(_mbs) ((size_t)_mbs << (20 - PAGE_SHIFT))
  71. #define TCMU_PAGES_TO_MBS(_pages) (_pages >> (20 - PAGE_SHIFT))
  72. /*
  73. * Default number of global data blocks(512K * PAGE_SIZE)
  74. * when the unmap thread will be started.
  75. */
  76. #define TCMU_GLOBAL_MAX_PAGES_DEF (512 * 1024)
  77. static u8 tcmu_kern_cmd_reply_supported;
  78. static u8 tcmu_netlink_blocked;
  79. static struct device *tcmu_root_device;
  80. struct tcmu_hba {
  81. u32 host_id;
  82. };
  83. #define TCMU_CONFIG_LEN 256
  84. static DEFINE_MUTEX(tcmu_nl_cmd_mutex);
  85. static LIST_HEAD(tcmu_nl_cmd_list);
  86. struct tcmu_dev;
  87. struct tcmu_nl_cmd {
  88. /* wake up thread waiting for reply */
  89. struct completion complete;
  90. struct list_head nl_list;
  91. struct tcmu_dev *udev;
  92. int cmd;
  93. int status;
  94. };
  95. struct tcmu_dev {
  96. struct list_head node;
  97. struct kref kref;
  98. struct se_device se_dev;
  99. struct se_dev_plug se_plug;
  100. char *name;
  101. struct se_hba *hba;
  102. #define TCMU_DEV_BIT_OPEN 0
  103. #define TCMU_DEV_BIT_BROKEN 1
  104. #define TCMU_DEV_BIT_BLOCKED 2
  105. #define TCMU_DEV_BIT_TMR_NOTIFY 3
  106. #define TCMU_DEV_BIT_PLUGGED 4
  107. unsigned long flags;
  108. struct uio_info uio_info;
  109. struct inode *inode;
  110. uint64_t dev_size;
  111. struct tcmu_mailbox *mb_addr;
  112. void *cmdr;
  113. u32 cmdr_size;
  114. u32 cmdr_last_cleaned;
  115. /* Offset of data area from start of mb */
  116. /* Must add data_off and mb_addr to get the address */
  117. size_t data_off;
  118. int data_area_mb;
  119. uint32_t max_blocks;
  120. size_t mmap_pages;
  121. struct mutex cmdr_lock;
  122. struct list_head qfull_queue;
  123. struct list_head tmr_queue;
  124. uint32_t dbi_max;
  125. uint32_t dbi_thresh;
  126. unsigned long *data_bitmap;
  127. struct xarray data_pages;
  128. uint32_t data_pages_per_blk;
  129. uint32_t data_blk_size;
  130. struct xarray commands;
  131. struct timer_list cmd_timer;
  132. unsigned int cmd_time_out;
  133. struct list_head inflight_queue;
  134. struct timer_list qfull_timer;
  135. int qfull_time_out;
  136. struct list_head timedout_entry;
  137. struct tcmu_nl_cmd curr_nl_cmd;
  138. char dev_config[TCMU_CONFIG_LEN];
  139. int nl_reply_supported;
  140. };
  141. #define TCMU_DEV(_se_dev) container_of(_se_dev, struct tcmu_dev, se_dev)
  142. struct tcmu_cmd {
  143. struct se_cmd *se_cmd;
  144. struct tcmu_dev *tcmu_dev;
  145. struct list_head queue_entry;
  146. uint16_t cmd_id;
  147. /* Can't use se_cmd when cleaning up expired cmds, because if
  148. cmd has been completed then accessing se_cmd is off limits */
  149. uint32_t dbi_cnt;
  150. uint32_t dbi_bidi_cnt;
  151. uint32_t dbi_cur;
  152. uint32_t *dbi;
  153. uint32_t data_len_bidi;
  154. unsigned long deadline;
  155. #define TCMU_CMD_BIT_EXPIRED 0
  156. #define TCMU_CMD_BIT_KEEP_BUF 1
  157. unsigned long flags;
  158. };
  159. struct tcmu_tmr {
  160. struct list_head queue_entry;
  161. uint8_t tmr_type;
  162. uint32_t tmr_cmd_cnt;
  163. int16_t tmr_cmd_ids[] __counted_by(tmr_cmd_cnt);
  164. };
  165. /*
  166. * To avoid dead lock the mutex lock order should always be:
  167. *
  168. * mutex_lock(&root_udev_mutex);
  169. * ...
  170. * mutex_lock(&tcmu_dev->cmdr_lock);
  171. * mutex_unlock(&tcmu_dev->cmdr_lock);
  172. * ...
  173. * mutex_unlock(&root_udev_mutex);
  174. */
  175. static DEFINE_MUTEX(root_udev_mutex);
  176. static LIST_HEAD(root_udev);
  177. static DEFINE_SPINLOCK(timed_out_udevs_lock);
  178. static LIST_HEAD(timed_out_udevs);
  179. static struct kmem_cache *tcmu_cmd_cache;
  180. static atomic_t global_page_count = ATOMIC_INIT(0);
  181. static struct delayed_work tcmu_unmap_work;
  182. static int tcmu_global_max_pages = TCMU_GLOBAL_MAX_PAGES_DEF;
  183. static int tcmu_set_global_max_data_area(const char *str,
  184. const struct kernel_param *kp)
  185. {
  186. int ret, max_area_mb;
  187. ret = kstrtoint(str, 10, &max_area_mb);
  188. if (ret)
  189. return -EINVAL;
  190. if (max_area_mb <= 0) {
  191. pr_err("global_max_data_area must be larger than 0.\n");
  192. return -EINVAL;
  193. }
  194. tcmu_global_max_pages = TCMU_MBS_TO_PAGES(max_area_mb);
  195. if (atomic_read(&global_page_count) > tcmu_global_max_pages)
  196. schedule_delayed_work(&tcmu_unmap_work, 0);
  197. else
  198. cancel_delayed_work_sync(&tcmu_unmap_work);
  199. return 0;
  200. }
  201. static int tcmu_get_global_max_data_area(char *buffer,
  202. const struct kernel_param *kp)
  203. {
  204. return sprintf(buffer, "%d\n", TCMU_PAGES_TO_MBS(tcmu_global_max_pages));
  205. }
  206. static const struct kernel_param_ops tcmu_global_max_data_area_op = {
  207. .set = tcmu_set_global_max_data_area,
  208. .get = tcmu_get_global_max_data_area,
  209. };
  210. module_param_cb(global_max_data_area_mb, &tcmu_global_max_data_area_op, NULL,
  211. S_IWUSR | S_IRUGO);
  212. MODULE_PARM_DESC(global_max_data_area_mb,
  213. "Max MBs allowed to be allocated to all the tcmu device's "
  214. "data areas.");
  215. static int tcmu_get_block_netlink(char *buffer,
  216. const struct kernel_param *kp)
  217. {
  218. return sprintf(buffer, "%s\n", tcmu_netlink_blocked ?
  219. "blocked" : "unblocked");
  220. }
  221. static int tcmu_set_block_netlink(const char *str,
  222. const struct kernel_param *kp)
  223. {
  224. int ret;
  225. u8 val;
  226. ret = kstrtou8(str, 0, &val);
  227. if (ret < 0)
  228. return ret;
  229. if (val > 1) {
  230. pr_err("Invalid block netlink value %u\n", val);
  231. return -EINVAL;
  232. }
  233. tcmu_netlink_blocked = val;
  234. return 0;
  235. }
  236. static const struct kernel_param_ops tcmu_block_netlink_op = {
  237. .set = tcmu_set_block_netlink,
  238. .get = tcmu_get_block_netlink,
  239. };
  240. module_param_cb(block_netlink, &tcmu_block_netlink_op, NULL, S_IWUSR | S_IRUGO);
  241. MODULE_PARM_DESC(block_netlink, "Block new netlink commands.");
  242. static int tcmu_fail_netlink_cmd(struct tcmu_nl_cmd *nl_cmd)
  243. {
  244. struct tcmu_dev *udev = nl_cmd->udev;
  245. if (!tcmu_netlink_blocked) {
  246. pr_err("Could not reset device's netlink interface. Netlink is not blocked.\n");
  247. return -EBUSY;
  248. }
  249. if (nl_cmd->cmd != TCMU_CMD_UNSPEC) {
  250. pr_debug("Aborting nl cmd %d on %s\n", nl_cmd->cmd, udev->name);
  251. nl_cmd->status = -EINTR;
  252. list_del(&nl_cmd->nl_list);
  253. complete(&nl_cmd->complete);
  254. }
  255. return 0;
  256. }
  257. static int tcmu_set_reset_netlink(const char *str,
  258. const struct kernel_param *kp)
  259. {
  260. struct tcmu_nl_cmd *nl_cmd, *tmp_cmd;
  261. int ret;
  262. u8 val;
  263. ret = kstrtou8(str, 0, &val);
  264. if (ret < 0)
  265. return ret;
  266. if (val != 1) {
  267. pr_err("Invalid reset netlink value %u\n", val);
  268. return -EINVAL;
  269. }
  270. mutex_lock(&tcmu_nl_cmd_mutex);
  271. list_for_each_entry_safe(nl_cmd, tmp_cmd, &tcmu_nl_cmd_list, nl_list) {
  272. ret = tcmu_fail_netlink_cmd(nl_cmd);
  273. if (ret)
  274. break;
  275. }
  276. mutex_unlock(&tcmu_nl_cmd_mutex);
  277. return ret;
  278. }
  279. static const struct kernel_param_ops tcmu_reset_netlink_op = {
  280. .set = tcmu_set_reset_netlink,
  281. };
  282. module_param_cb(reset_netlink, &tcmu_reset_netlink_op, NULL, S_IWUSR);
  283. MODULE_PARM_DESC(reset_netlink, "Reset netlink commands.");
  284. /* multicast group */
  285. enum tcmu_multicast_groups {
  286. TCMU_MCGRP_CONFIG,
  287. };
  288. static const struct genl_multicast_group tcmu_mcgrps[] = {
  289. [TCMU_MCGRP_CONFIG] = { .name = "config", },
  290. };
  291. static struct nla_policy tcmu_attr_policy[TCMU_ATTR_MAX+1] = {
  292. [TCMU_ATTR_DEVICE] = { .type = NLA_STRING },
  293. [TCMU_ATTR_MINOR] = { .type = NLA_U32 },
  294. [TCMU_ATTR_CMD_STATUS] = { .type = NLA_S32 },
  295. [TCMU_ATTR_DEVICE_ID] = { .type = NLA_U32 },
  296. [TCMU_ATTR_SUPP_KERN_CMD_REPLY] = { .type = NLA_U8 },
  297. };
  298. static int tcmu_genl_cmd_done(struct genl_info *info, int completed_cmd)
  299. {
  300. struct tcmu_dev *udev = NULL;
  301. struct tcmu_nl_cmd *nl_cmd;
  302. int dev_id, rc, ret = 0;
  303. if (!info->attrs[TCMU_ATTR_CMD_STATUS] ||
  304. !info->attrs[TCMU_ATTR_DEVICE_ID]) {
  305. printk(KERN_ERR "TCMU_ATTR_CMD_STATUS or TCMU_ATTR_DEVICE_ID not set, doing nothing\n");
  306. return -EINVAL;
  307. }
  308. dev_id = nla_get_u32(info->attrs[TCMU_ATTR_DEVICE_ID]);
  309. rc = nla_get_s32(info->attrs[TCMU_ATTR_CMD_STATUS]);
  310. mutex_lock(&tcmu_nl_cmd_mutex);
  311. list_for_each_entry(nl_cmd, &tcmu_nl_cmd_list, nl_list) {
  312. if (nl_cmd->udev->se_dev.dev_index == dev_id) {
  313. udev = nl_cmd->udev;
  314. break;
  315. }
  316. }
  317. if (!udev) {
  318. pr_err("tcmu nl cmd %u/%d completion could not find device with dev id %u.\n",
  319. completed_cmd, rc, dev_id);
  320. ret = -ENODEV;
  321. goto unlock;
  322. }
  323. list_del(&nl_cmd->nl_list);
  324. pr_debug("%s genl cmd done got id %d curr %d done %d rc %d stat %d\n",
  325. udev->name, dev_id, nl_cmd->cmd, completed_cmd, rc,
  326. nl_cmd->status);
  327. if (nl_cmd->cmd != completed_cmd) {
  328. pr_err("Mismatched commands on %s (Expecting reply for %d. Current %d).\n",
  329. udev->name, completed_cmd, nl_cmd->cmd);
  330. ret = -EINVAL;
  331. goto unlock;
  332. }
  333. nl_cmd->status = rc;
  334. complete(&nl_cmd->complete);
  335. unlock:
  336. mutex_unlock(&tcmu_nl_cmd_mutex);
  337. return ret;
  338. }
  339. static int tcmu_genl_rm_dev_done(struct sk_buff *skb, struct genl_info *info)
  340. {
  341. return tcmu_genl_cmd_done(info, TCMU_CMD_REMOVED_DEVICE);
  342. }
  343. static int tcmu_genl_add_dev_done(struct sk_buff *skb, struct genl_info *info)
  344. {
  345. return tcmu_genl_cmd_done(info, TCMU_CMD_ADDED_DEVICE);
  346. }
  347. static int tcmu_genl_reconfig_dev_done(struct sk_buff *skb,
  348. struct genl_info *info)
  349. {
  350. return tcmu_genl_cmd_done(info, TCMU_CMD_RECONFIG_DEVICE);
  351. }
  352. static int tcmu_genl_set_features(struct sk_buff *skb, struct genl_info *info)
  353. {
  354. if (info->attrs[TCMU_ATTR_SUPP_KERN_CMD_REPLY]) {
  355. tcmu_kern_cmd_reply_supported =
  356. nla_get_u8(info->attrs[TCMU_ATTR_SUPP_KERN_CMD_REPLY]);
  357. printk(KERN_INFO "tcmu daemon: command reply support %u.\n",
  358. tcmu_kern_cmd_reply_supported);
  359. }
  360. return 0;
  361. }
  362. static const struct genl_small_ops tcmu_genl_ops[] = {
  363. {
  364. .cmd = TCMU_CMD_SET_FEATURES,
  365. .validate = GENL_DONT_VALIDATE_STRICT | GENL_DONT_VALIDATE_DUMP,
  366. .flags = GENL_ADMIN_PERM,
  367. .doit = tcmu_genl_set_features,
  368. },
  369. {
  370. .cmd = TCMU_CMD_ADDED_DEVICE_DONE,
  371. .validate = GENL_DONT_VALIDATE_STRICT | GENL_DONT_VALIDATE_DUMP,
  372. .flags = GENL_ADMIN_PERM,
  373. .doit = tcmu_genl_add_dev_done,
  374. },
  375. {
  376. .cmd = TCMU_CMD_REMOVED_DEVICE_DONE,
  377. .validate = GENL_DONT_VALIDATE_STRICT | GENL_DONT_VALIDATE_DUMP,
  378. .flags = GENL_ADMIN_PERM,
  379. .doit = tcmu_genl_rm_dev_done,
  380. },
  381. {
  382. .cmd = TCMU_CMD_RECONFIG_DEVICE_DONE,
  383. .validate = GENL_DONT_VALIDATE_STRICT | GENL_DONT_VALIDATE_DUMP,
  384. .flags = GENL_ADMIN_PERM,
  385. .doit = tcmu_genl_reconfig_dev_done,
  386. },
  387. };
  388. /* Our generic netlink family */
  389. static struct genl_family tcmu_genl_family __ro_after_init = {
  390. .module = THIS_MODULE,
  391. .hdrsize = 0,
  392. .name = "TCM-USER",
  393. .version = 2,
  394. .maxattr = TCMU_ATTR_MAX,
  395. .policy = tcmu_attr_policy,
  396. .mcgrps = tcmu_mcgrps,
  397. .n_mcgrps = ARRAY_SIZE(tcmu_mcgrps),
  398. .netnsok = true,
  399. .small_ops = tcmu_genl_ops,
  400. .n_small_ops = ARRAY_SIZE(tcmu_genl_ops),
  401. .resv_start_op = TCMU_CMD_SET_FEATURES + 1,
  402. };
  403. #define tcmu_cmd_set_dbi_cur(cmd, index) ((cmd)->dbi_cur = (index))
  404. #define tcmu_cmd_reset_dbi_cur(cmd) tcmu_cmd_set_dbi_cur(cmd, 0)
  405. #define tcmu_cmd_set_dbi(cmd, index) ((cmd)->dbi[(cmd)->dbi_cur++] = (index))
  406. #define tcmu_cmd_get_dbi(cmd) ((cmd)->dbi[(cmd)->dbi_cur++])
  407. static void tcmu_cmd_free_data(struct tcmu_cmd *tcmu_cmd, uint32_t len)
  408. {
  409. struct tcmu_dev *udev = tcmu_cmd->tcmu_dev;
  410. uint32_t i;
  411. for (i = 0; i < len; i++)
  412. clear_bit(tcmu_cmd->dbi[i], udev->data_bitmap);
  413. }
  414. static inline int tcmu_get_empty_block(struct tcmu_dev *udev,
  415. struct tcmu_cmd *tcmu_cmd,
  416. int prev_dbi, int length, int *iov_cnt)
  417. {
  418. XA_STATE(xas, &udev->data_pages, 0);
  419. struct page *page;
  420. int i, cnt, dbi, dpi;
  421. int page_cnt = DIV_ROUND_UP(length, PAGE_SIZE);
  422. dbi = find_first_zero_bit(udev->data_bitmap, udev->dbi_thresh);
  423. if (dbi == udev->dbi_thresh)
  424. return -1;
  425. dpi = dbi * udev->data_pages_per_blk;
  426. /* Count the number of already allocated pages */
  427. xas_set(&xas, dpi);
  428. rcu_read_lock();
  429. for (cnt = 0; xas_next(&xas) && cnt < page_cnt;)
  430. cnt++;
  431. rcu_read_unlock();
  432. for (i = cnt; i < page_cnt; i++) {
  433. /* try to get new zeroed page from the mm */
  434. page = alloc_page(GFP_NOIO | __GFP_ZERO);
  435. if (!page)
  436. break;
  437. if (xa_store(&udev->data_pages, dpi + i, page, GFP_NOIO)) {
  438. __free_page(page);
  439. break;
  440. }
  441. }
  442. if (atomic_add_return(i - cnt, &global_page_count) >
  443. tcmu_global_max_pages)
  444. schedule_delayed_work(&tcmu_unmap_work, 0);
  445. if (i && dbi > udev->dbi_max)
  446. udev->dbi_max = dbi;
  447. set_bit(dbi, udev->data_bitmap);
  448. tcmu_cmd_set_dbi(tcmu_cmd, dbi);
  449. if (dbi != prev_dbi + 1)
  450. *iov_cnt += 1;
  451. return i == page_cnt ? dbi : -1;
  452. }
  453. static int tcmu_get_empty_blocks(struct tcmu_dev *udev,
  454. struct tcmu_cmd *tcmu_cmd, int length)
  455. {
  456. /* start value of dbi + 1 must not be a valid dbi */
  457. int dbi = -2;
  458. int blk_data_len, iov_cnt = 0;
  459. uint32_t blk_size = udev->data_blk_size;
  460. for (; length > 0; length -= blk_size) {
  461. blk_data_len = min_t(uint32_t, length, blk_size);
  462. dbi = tcmu_get_empty_block(udev, tcmu_cmd, dbi, blk_data_len,
  463. &iov_cnt);
  464. if (dbi < 0)
  465. return -1;
  466. }
  467. return iov_cnt;
  468. }
  469. static inline void tcmu_free_cmd(struct tcmu_cmd *tcmu_cmd)
  470. {
  471. kfree(tcmu_cmd->dbi);
  472. kmem_cache_free(tcmu_cmd_cache, tcmu_cmd);
  473. }
  474. static inline void tcmu_cmd_set_block_cnts(struct tcmu_cmd *cmd)
  475. {
  476. int i, len;
  477. struct se_cmd *se_cmd = cmd->se_cmd;
  478. uint32_t blk_size = cmd->tcmu_dev->data_blk_size;
  479. cmd->dbi_cnt = DIV_ROUND_UP(se_cmd->data_length, blk_size);
  480. if (se_cmd->se_cmd_flags & SCF_BIDI) {
  481. BUG_ON(!(se_cmd->t_bidi_data_sg && se_cmd->t_bidi_data_nents));
  482. for (i = 0, len = 0; i < se_cmd->t_bidi_data_nents; i++)
  483. len += se_cmd->t_bidi_data_sg[i].length;
  484. cmd->dbi_bidi_cnt = DIV_ROUND_UP(len, blk_size);
  485. cmd->dbi_cnt += cmd->dbi_bidi_cnt;
  486. cmd->data_len_bidi = len;
  487. }
  488. }
  489. static int new_block_to_iov(struct tcmu_dev *udev, struct tcmu_cmd *cmd,
  490. struct iovec **iov, int prev_dbi, int len)
  491. {
  492. /* Get the next dbi */
  493. int dbi = tcmu_cmd_get_dbi(cmd);
  494. /* Do not add more than udev->data_blk_size to iov */
  495. len = min_t(int, len, udev->data_blk_size);
  496. /*
  497. * The following code will gather and map the blocks to the same iovec
  498. * when the blocks are all next to each other.
  499. */
  500. if (dbi != prev_dbi + 1) {
  501. /* dbi is not next to previous dbi, so start new iov */
  502. if (prev_dbi >= 0)
  503. (*iov)++;
  504. /* write offset relative to mb_addr */
  505. (*iov)->iov_base = (void __user *)
  506. (udev->data_off + dbi * udev->data_blk_size);
  507. }
  508. (*iov)->iov_len += len;
  509. return dbi;
  510. }
  511. static void tcmu_setup_iovs(struct tcmu_dev *udev, struct tcmu_cmd *cmd,
  512. struct iovec **iov, int data_length)
  513. {
  514. /* start value of dbi + 1 must not be a valid dbi */
  515. int dbi = -2;
  516. /* We prepare the IOVs for DMA_FROM_DEVICE transfer direction */
  517. for (; data_length > 0; data_length -= udev->data_blk_size)
  518. dbi = new_block_to_iov(udev, cmd, iov, dbi, data_length);
  519. }
  520. static struct tcmu_cmd *tcmu_alloc_cmd(struct se_cmd *se_cmd)
  521. {
  522. struct se_device *se_dev = se_cmd->se_dev;
  523. struct tcmu_dev *udev = TCMU_DEV(se_dev);
  524. struct tcmu_cmd *tcmu_cmd;
  525. tcmu_cmd = kmem_cache_zalloc(tcmu_cmd_cache, GFP_NOIO);
  526. if (!tcmu_cmd)
  527. return NULL;
  528. INIT_LIST_HEAD(&tcmu_cmd->queue_entry);
  529. tcmu_cmd->se_cmd = se_cmd;
  530. tcmu_cmd->tcmu_dev = udev;
  531. tcmu_cmd_set_block_cnts(tcmu_cmd);
  532. tcmu_cmd->dbi = kcalloc(tcmu_cmd->dbi_cnt, sizeof(uint32_t),
  533. GFP_NOIO);
  534. if (!tcmu_cmd->dbi) {
  535. kmem_cache_free(tcmu_cmd_cache, tcmu_cmd);
  536. return NULL;
  537. }
  538. return tcmu_cmd;
  539. }
  540. static inline void tcmu_flush_dcache_range(void *vaddr, size_t size)
  541. {
  542. unsigned long offset = offset_in_page(vaddr);
  543. void *start = vaddr - offset;
  544. size = round_up(size+offset, PAGE_SIZE);
  545. while (size) {
  546. flush_dcache_page(vmalloc_to_page(start));
  547. start += PAGE_SIZE;
  548. size -= PAGE_SIZE;
  549. }
  550. }
  551. /*
  552. * Some ring helper functions. We don't assume size is a power of 2 so
  553. * we can't use circ_buf.h.
  554. */
  555. static inline size_t spc_used(size_t head, size_t tail, size_t size)
  556. {
  557. int diff = head - tail;
  558. if (diff >= 0)
  559. return diff;
  560. else
  561. return size + diff;
  562. }
  563. static inline size_t spc_free(size_t head, size_t tail, size_t size)
  564. {
  565. /* Keep 1 byte unused or we can't tell full from empty */
  566. return (size - spc_used(head, tail, size) - 1);
  567. }
  568. static inline size_t head_to_end(size_t head, size_t size)
  569. {
  570. return size - head;
  571. }
  572. #define UPDATE_HEAD(head, used, size) smp_store_release(&head, ((head % size) + used) % size)
  573. #define TCMU_SG_TO_DATA_AREA 1
  574. #define TCMU_DATA_AREA_TO_SG 2
  575. static inline void tcmu_copy_data(struct tcmu_dev *udev,
  576. struct tcmu_cmd *tcmu_cmd, uint32_t direction,
  577. struct scatterlist *sg, unsigned int sg_nents,
  578. struct iovec **iov, size_t data_len)
  579. {
  580. /* start value of dbi + 1 must not be a valid dbi */
  581. int dbi = -2;
  582. size_t page_remaining, cp_len;
  583. int page_cnt, page_inx, dpi;
  584. struct sg_mapping_iter sg_iter;
  585. unsigned int sg_flags;
  586. struct page *page;
  587. void *data_page_start, *data_addr;
  588. if (direction == TCMU_SG_TO_DATA_AREA)
  589. sg_flags = SG_MITER_ATOMIC | SG_MITER_FROM_SG;
  590. else
  591. sg_flags = SG_MITER_ATOMIC | SG_MITER_TO_SG;
  592. sg_miter_start(&sg_iter, sg, sg_nents, sg_flags);
  593. while (data_len) {
  594. if (direction == TCMU_SG_TO_DATA_AREA)
  595. dbi = new_block_to_iov(udev, tcmu_cmd, iov, dbi,
  596. data_len);
  597. else
  598. dbi = tcmu_cmd_get_dbi(tcmu_cmd);
  599. page_cnt = DIV_ROUND_UP(data_len, PAGE_SIZE);
  600. if (page_cnt > udev->data_pages_per_blk)
  601. page_cnt = udev->data_pages_per_blk;
  602. dpi = dbi * udev->data_pages_per_blk;
  603. for (page_inx = 0; page_inx < page_cnt && data_len;
  604. page_inx++, dpi++) {
  605. page = xa_load(&udev->data_pages, dpi);
  606. if (direction == TCMU_DATA_AREA_TO_SG)
  607. flush_dcache_page(page);
  608. data_page_start = kmap_atomic(page);
  609. page_remaining = PAGE_SIZE;
  610. while (page_remaining && data_len) {
  611. if (!sg_miter_next(&sg_iter)) {
  612. /* set length to 0 to abort outer loop */
  613. data_len = 0;
  614. pr_debug("%s: aborting data copy due to exhausted sg_list\n",
  615. __func__);
  616. break;
  617. }
  618. cp_len = min3(sg_iter.length, page_remaining,
  619. data_len);
  620. data_addr = data_page_start +
  621. PAGE_SIZE - page_remaining;
  622. if (direction == TCMU_SG_TO_DATA_AREA)
  623. memcpy(data_addr, sg_iter.addr, cp_len);
  624. else
  625. memcpy(sg_iter.addr, data_addr, cp_len);
  626. data_len -= cp_len;
  627. page_remaining -= cp_len;
  628. sg_iter.consumed = cp_len;
  629. }
  630. sg_miter_stop(&sg_iter);
  631. kunmap_atomic(data_page_start);
  632. if (direction == TCMU_SG_TO_DATA_AREA)
  633. flush_dcache_page(page);
  634. }
  635. }
  636. }
  637. static void scatter_data_area(struct tcmu_dev *udev, struct tcmu_cmd *tcmu_cmd,
  638. struct iovec **iov)
  639. {
  640. struct se_cmd *se_cmd = tcmu_cmd->se_cmd;
  641. tcmu_copy_data(udev, tcmu_cmd, TCMU_SG_TO_DATA_AREA, se_cmd->t_data_sg,
  642. se_cmd->t_data_nents, iov, se_cmd->data_length);
  643. }
  644. static void gather_data_area(struct tcmu_dev *udev, struct tcmu_cmd *tcmu_cmd,
  645. bool bidi, uint32_t read_len)
  646. {
  647. struct se_cmd *se_cmd = tcmu_cmd->se_cmd;
  648. struct scatterlist *data_sg;
  649. unsigned int data_nents;
  650. if (!bidi) {
  651. data_sg = se_cmd->t_data_sg;
  652. data_nents = se_cmd->t_data_nents;
  653. } else {
  654. /*
  655. * For bidi case, the first count blocks are for Data-Out
  656. * buffer blocks, and before gathering the Data-In buffer
  657. * the Data-Out buffer blocks should be skipped.
  658. */
  659. tcmu_cmd_set_dbi_cur(tcmu_cmd,
  660. tcmu_cmd->dbi_cnt - tcmu_cmd->dbi_bidi_cnt);
  661. data_sg = se_cmd->t_bidi_data_sg;
  662. data_nents = se_cmd->t_bidi_data_nents;
  663. }
  664. tcmu_copy_data(udev, tcmu_cmd, TCMU_DATA_AREA_TO_SG, data_sg,
  665. data_nents, NULL, read_len);
  666. }
  667. static inline size_t spc_bitmap_free(unsigned long *bitmap, uint32_t thresh)
  668. {
  669. return thresh - bitmap_weight(bitmap, thresh);
  670. }
  671. /*
  672. * We can't queue a command until we have space available on the cmd ring.
  673. *
  674. * Called with ring lock held.
  675. */
  676. static bool is_ring_space_avail(struct tcmu_dev *udev, size_t cmd_size)
  677. {
  678. struct tcmu_mailbox *mb = udev->mb_addr;
  679. size_t space, cmd_needed;
  680. u32 cmd_head;
  681. tcmu_flush_dcache_range(mb, sizeof(*mb));
  682. cmd_head = mb->cmd_head % udev->cmdr_size; /* UAM */
  683. /*
  684. * If cmd end-of-ring space is too small then we need space for a NOP plus
  685. * original cmd - cmds are internally contiguous.
  686. */
  687. if (head_to_end(cmd_head, udev->cmdr_size) >= cmd_size)
  688. cmd_needed = cmd_size;
  689. else
  690. cmd_needed = cmd_size + head_to_end(cmd_head, udev->cmdr_size);
  691. space = spc_free(cmd_head, udev->cmdr_last_cleaned, udev->cmdr_size);
  692. if (space < cmd_needed) {
  693. pr_debug("no cmd space: %u %u %u\n", cmd_head,
  694. udev->cmdr_last_cleaned, udev->cmdr_size);
  695. return false;
  696. }
  697. return true;
  698. }
  699. /*
  700. * We have to allocate data buffers before we can queue a command.
  701. * Returns -1 on error (not enough space) or number of needed iovs on success
  702. *
  703. * Called with ring lock held.
  704. */
  705. static int tcmu_alloc_data_space(struct tcmu_dev *udev, struct tcmu_cmd *cmd,
  706. int *iov_bidi_cnt)
  707. {
  708. int space, iov_cnt = 0, ret = 0;
  709. if (!cmd->dbi_cnt)
  710. goto wr_iov_cnts;
  711. /* try to check and get the data blocks as needed */
  712. space = spc_bitmap_free(udev->data_bitmap, udev->dbi_thresh);
  713. if (space < cmd->dbi_cnt) {
  714. unsigned long blocks_left =
  715. (udev->max_blocks - udev->dbi_thresh) + space;
  716. if (blocks_left < cmd->dbi_cnt) {
  717. pr_debug("no data space: only %lu available, but ask for %u\n",
  718. blocks_left * udev->data_blk_size,
  719. cmd->dbi_cnt * udev->data_blk_size);
  720. return -1;
  721. }
  722. udev->dbi_thresh += cmd->dbi_cnt;
  723. if (udev->dbi_thresh > udev->max_blocks)
  724. udev->dbi_thresh = udev->max_blocks;
  725. }
  726. iov_cnt = tcmu_get_empty_blocks(udev, cmd, cmd->se_cmd->data_length);
  727. if (iov_cnt < 0)
  728. return -1;
  729. if (cmd->dbi_bidi_cnt) {
  730. ret = tcmu_get_empty_blocks(udev, cmd, cmd->data_len_bidi);
  731. if (ret < 0)
  732. return -1;
  733. }
  734. wr_iov_cnts:
  735. *iov_bidi_cnt = ret;
  736. return iov_cnt + ret;
  737. }
  738. static inline size_t tcmu_cmd_get_base_cmd_size(size_t iov_cnt)
  739. {
  740. return max(offsetof(struct tcmu_cmd_entry, req.iov[iov_cnt]),
  741. sizeof(struct tcmu_cmd_entry));
  742. }
  743. static inline size_t tcmu_cmd_get_cmd_size(struct tcmu_cmd *tcmu_cmd,
  744. size_t base_command_size)
  745. {
  746. struct se_cmd *se_cmd = tcmu_cmd->se_cmd;
  747. size_t command_size;
  748. command_size = base_command_size +
  749. round_up(scsi_command_size(se_cmd->t_task_cdb),
  750. TCMU_OP_ALIGN_SIZE);
  751. WARN_ON(command_size & (TCMU_OP_ALIGN_SIZE-1));
  752. return command_size;
  753. }
  754. static void tcmu_setup_cmd_timer(struct tcmu_cmd *tcmu_cmd, unsigned int tmo,
  755. struct timer_list *timer)
  756. {
  757. if (!tmo)
  758. return;
  759. tcmu_cmd->deadline = round_jiffies_up(jiffies + msecs_to_jiffies(tmo));
  760. if (!timer_pending(timer))
  761. mod_timer(timer, tcmu_cmd->deadline);
  762. pr_debug("Timeout set up for cmd %p, dev = %s, tmo = %lu\n", tcmu_cmd,
  763. tcmu_cmd->tcmu_dev->name, tmo / MSEC_PER_SEC);
  764. }
  765. static int add_to_qfull_queue(struct tcmu_cmd *tcmu_cmd)
  766. {
  767. struct tcmu_dev *udev = tcmu_cmd->tcmu_dev;
  768. unsigned int tmo;
  769. /*
  770. * For backwards compat if qfull_time_out is not set use
  771. * cmd_time_out and if that's not set use the default time out.
  772. */
  773. if (!udev->qfull_time_out)
  774. return -ETIMEDOUT;
  775. else if (udev->qfull_time_out > 0)
  776. tmo = udev->qfull_time_out;
  777. else if (udev->cmd_time_out)
  778. tmo = udev->cmd_time_out;
  779. else
  780. tmo = TCMU_TIME_OUT;
  781. tcmu_setup_cmd_timer(tcmu_cmd, tmo, &udev->qfull_timer);
  782. list_add_tail(&tcmu_cmd->queue_entry, &udev->qfull_queue);
  783. pr_debug("adding cmd %p on dev %s to ring space wait queue\n",
  784. tcmu_cmd, udev->name);
  785. return 0;
  786. }
  787. static uint32_t ring_insert_padding(struct tcmu_dev *udev, size_t cmd_size)
  788. {
  789. struct tcmu_cmd_entry_hdr *hdr;
  790. struct tcmu_mailbox *mb = udev->mb_addr;
  791. uint32_t cmd_head = mb->cmd_head % udev->cmdr_size; /* UAM */
  792. /* Insert a PAD if end-of-ring space is too small */
  793. if (head_to_end(cmd_head, udev->cmdr_size) < cmd_size) {
  794. size_t pad_size = head_to_end(cmd_head, udev->cmdr_size);
  795. hdr = udev->cmdr + cmd_head;
  796. tcmu_hdr_set_op(&hdr->len_op, TCMU_OP_PAD);
  797. tcmu_hdr_set_len(&hdr->len_op, pad_size);
  798. hdr->cmd_id = 0; /* not used for PAD */
  799. hdr->kflags = 0;
  800. hdr->uflags = 0;
  801. tcmu_flush_dcache_range(hdr, sizeof(*hdr));
  802. UPDATE_HEAD(mb->cmd_head, pad_size, udev->cmdr_size);
  803. tcmu_flush_dcache_range(mb, sizeof(*mb));
  804. cmd_head = mb->cmd_head % udev->cmdr_size; /* UAM */
  805. WARN_ON(cmd_head != 0);
  806. }
  807. return cmd_head;
  808. }
  809. static void tcmu_unplug_device(struct se_dev_plug *se_plug)
  810. {
  811. struct se_device *se_dev = se_plug->se_dev;
  812. struct tcmu_dev *udev = TCMU_DEV(se_dev);
  813. clear_bit(TCMU_DEV_BIT_PLUGGED, &udev->flags);
  814. uio_event_notify(&udev->uio_info);
  815. }
  816. static struct se_dev_plug *tcmu_plug_device(struct se_device *se_dev)
  817. {
  818. struct tcmu_dev *udev = TCMU_DEV(se_dev);
  819. if (!test_and_set_bit(TCMU_DEV_BIT_PLUGGED, &udev->flags))
  820. return &udev->se_plug;
  821. return NULL;
  822. }
  823. /**
  824. * queue_cmd_ring - queue cmd to ring or internally
  825. * @tcmu_cmd: cmd to queue
  826. * @scsi_err: TCM error code if failure (-1) returned.
  827. *
  828. * Returns:
  829. * -1 we cannot queue internally or to the ring.
  830. * 0 success
  831. * 1 internally queued to wait for ring memory to free.
  832. */
  833. static int queue_cmd_ring(struct tcmu_cmd *tcmu_cmd, sense_reason_t *scsi_err)
  834. {
  835. struct tcmu_dev *udev = tcmu_cmd->tcmu_dev;
  836. struct se_cmd *se_cmd = tcmu_cmd->se_cmd;
  837. size_t base_command_size, command_size;
  838. struct tcmu_mailbox *mb = udev->mb_addr;
  839. struct tcmu_cmd_entry *entry;
  840. struct iovec *iov;
  841. int iov_cnt, iov_bidi_cnt;
  842. uint32_t cmd_id, cmd_head;
  843. uint64_t cdb_off;
  844. uint32_t blk_size = udev->data_blk_size;
  845. /* size of data buffer needed */
  846. size_t data_length = (size_t)tcmu_cmd->dbi_cnt * blk_size;
  847. *scsi_err = TCM_NO_SENSE;
  848. if (test_bit(TCMU_DEV_BIT_BLOCKED, &udev->flags)) {
  849. *scsi_err = TCM_LUN_BUSY;
  850. return -1;
  851. }
  852. if (test_bit(TCMU_DEV_BIT_BROKEN, &udev->flags)) {
  853. *scsi_err = TCM_LOGICAL_UNIT_COMMUNICATION_FAILURE;
  854. return -1;
  855. }
  856. if (!list_empty(&udev->qfull_queue))
  857. goto queue;
  858. if (data_length > (size_t)udev->max_blocks * blk_size) {
  859. pr_warn("TCMU: Request of size %zu is too big for %zu data area\n",
  860. data_length, (size_t)udev->max_blocks * blk_size);
  861. *scsi_err = TCM_INVALID_CDB_FIELD;
  862. return -1;
  863. }
  864. iov_cnt = tcmu_alloc_data_space(udev, tcmu_cmd, &iov_bidi_cnt);
  865. if (iov_cnt < 0)
  866. goto free_and_queue;
  867. /*
  868. * Must be a certain minimum size for response sense info, but
  869. * also may be larger if the iov array is large.
  870. */
  871. base_command_size = tcmu_cmd_get_base_cmd_size(iov_cnt);
  872. command_size = tcmu_cmd_get_cmd_size(tcmu_cmd, base_command_size);
  873. if (command_size > (udev->cmdr_size / 2)) {
  874. pr_warn("TCMU: Request of size %zu is too big for %u cmd ring\n",
  875. command_size, udev->cmdr_size);
  876. tcmu_cmd_free_data(tcmu_cmd, tcmu_cmd->dbi_cur);
  877. *scsi_err = TCM_INVALID_CDB_FIELD;
  878. return -1;
  879. }
  880. if (!is_ring_space_avail(udev, command_size))
  881. /*
  882. * Don't leave commands partially setup because the unmap
  883. * thread might need the blocks to make forward progress.
  884. */
  885. goto free_and_queue;
  886. if (xa_alloc(&udev->commands, &cmd_id, tcmu_cmd, XA_LIMIT(1, 0xffff),
  887. GFP_NOWAIT) < 0) {
  888. pr_err("tcmu: Could not allocate cmd id.\n");
  889. tcmu_cmd_free_data(tcmu_cmd, tcmu_cmd->dbi_cnt);
  890. *scsi_err = TCM_OUT_OF_RESOURCES;
  891. return -1;
  892. }
  893. tcmu_cmd->cmd_id = cmd_id;
  894. pr_debug("allocated cmd id %u for cmd %p dev %s\n", tcmu_cmd->cmd_id,
  895. tcmu_cmd, udev->name);
  896. cmd_head = ring_insert_padding(udev, command_size);
  897. entry = udev->cmdr + cmd_head;
  898. memset(entry, 0, command_size);
  899. tcmu_hdr_set_op(&entry->hdr.len_op, TCMU_OP_CMD);
  900. /* prepare iov list and copy data to data area if necessary */
  901. tcmu_cmd_reset_dbi_cur(tcmu_cmd);
  902. iov = &entry->req.iov[0];
  903. if (se_cmd->data_direction == DMA_TO_DEVICE ||
  904. se_cmd->se_cmd_flags & SCF_BIDI)
  905. scatter_data_area(udev, tcmu_cmd, &iov);
  906. else
  907. tcmu_setup_iovs(udev, tcmu_cmd, &iov, se_cmd->data_length);
  908. entry->req.iov_cnt = iov_cnt - iov_bidi_cnt;
  909. /* Handle BIDI commands */
  910. if (se_cmd->se_cmd_flags & SCF_BIDI) {
  911. iov++;
  912. tcmu_setup_iovs(udev, tcmu_cmd, &iov, tcmu_cmd->data_len_bidi);
  913. entry->req.iov_bidi_cnt = iov_bidi_cnt;
  914. }
  915. tcmu_setup_cmd_timer(tcmu_cmd, udev->cmd_time_out, &udev->cmd_timer);
  916. entry->hdr.cmd_id = tcmu_cmd->cmd_id;
  917. tcmu_hdr_set_len(&entry->hdr.len_op, command_size);
  918. /* All offsets relative to mb_addr, not start of entry! */
  919. cdb_off = CMDR_OFF + cmd_head + base_command_size;
  920. memcpy((void *) mb + cdb_off, se_cmd->t_task_cdb, scsi_command_size(se_cmd->t_task_cdb));
  921. entry->req.cdb_off = cdb_off;
  922. tcmu_flush_dcache_range(entry, command_size);
  923. UPDATE_HEAD(mb->cmd_head, command_size, udev->cmdr_size);
  924. tcmu_flush_dcache_range(mb, sizeof(*mb));
  925. list_add_tail(&tcmu_cmd->queue_entry, &udev->inflight_queue);
  926. if (!test_bit(TCMU_DEV_BIT_PLUGGED, &udev->flags))
  927. uio_event_notify(&udev->uio_info);
  928. return 0;
  929. free_and_queue:
  930. tcmu_cmd_free_data(tcmu_cmd, tcmu_cmd->dbi_cur);
  931. tcmu_cmd_reset_dbi_cur(tcmu_cmd);
  932. queue:
  933. if (add_to_qfull_queue(tcmu_cmd)) {
  934. *scsi_err = TCM_OUT_OF_RESOURCES;
  935. return -1;
  936. }
  937. return 1;
  938. }
  939. /**
  940. * queue_tmr_ring - queue tmr info to ring or internally
  941. * @udev: related tcmu_dev
  942. * @tmr: tcmu_tmr containing tmr info to queue
  943. *
  944. * Returns:
  945. * 0 success
  946. * 1 internally queued to wait for ring memory to free.
  947. */
  948. static int
  949. queue_tmr_ring(struct tcmu_dev *udev, struct tcmu_tmr *tmr)
  950. {
  951. struct tcmu_tmr_entry *entry;
  952. int cmd_size;
  953. int id_list_sz;
  954. struct tcmu_mailbox *mb = udev->mb_addr;
  955. uint32_t cmd_head;
  956. if (test_bit(TCMU_DEV_BIT_BROKEN, &udev->flags))
  957. goto out_free;
  958. id_list_sz = sizeof(tmr->tmr_cmd_ids[0]) * tmr->tmr_cmd_cnt;
  959. cmd_size = round_up(sizeof(*entry) + id_list_sz, TCMU_OP_ALIGN_SIZE);
  960. if (!list_empty(&udev->tmr_queue) ||
  961. !is_ring_space_avail(udev, cmd_size)) {
  962. list_add_tail(&tmr->queue_entry, &udev->tmr_queue);
  963. pr_debug("adding tmr %p on dev %s to TMR ring space wait queue\n",
  964. tmr, udev->name);
  965. return 1;
  966. }
  967. cmd_head = ring_insert_padding(udev, cmd_size);
  968. entry = udev->cmdr + cmd_head;
  969. memset(entry, 0, cmd_size);
  970. tcmu_hdr_set_op(&entry->hdr.len_op, TCMU_OP_TMR);
  971. tcmu_hdr_set_len(&entry->hdr.len_op, cmd_size);
  972. entry->tmr_type = tmr->tmr_type;
  973. entry->cmd_cnt = tmr->tmr_cmd_cnt;
  974. memcpy(&entry->cmd_ids[0], &tmr->tmr_cmd_ids[0], id_list_sz);
  975. tcmu_flush_dcache_range(entry, cmd_size);
  976. UPDATE_HEAD(mb->cmd_head, cmd_size, udev->cmdr_size);
  977. tcmu_flush_dcache_range(mb, sizeof(*mb));
  978. uio_event_notify(&udev->uio_info);
  979. out_free:
  980. kfree(tmr);
  981. return 0;
  982. }
  983. static sense_reason_t
  984. tcmu_queue_cmd(struct se_cmd *se_cmd)
  985. {
  986. struct se_device *se_dev = se_cmd->se_dev;
  987. struct tcmu_dev *udev = TCMU_DEV(se_dev);
  988. struct tcmu_cmd *tcmu_cmd;
  989. sense_reason_t scsi_ret = TCM_CHECK_CONDITION_ABORT_CMD;
  990. int ret = -1;
  991. tcmu_cmd = tcmu_alloc_cmd(se_cmd);
  992. if (!tcmu_cmd)
  993. return TCM_LOGICAL_UNIT_COMMUNICATION_FAILURE;
  994. mutex_lock(&udev->cmdr_lock);
  995. if (!(se_cmd->transport_state & CMD_T_ABORTED))
  996. ret = queue_cmd_ring(tcmu_cmd, &scsi_ret);
  997. if (ret < 0)
  998. tcmu_free_cmd(tcmu_cmd);
  999. else
  1000. se_cmd->priv = tcmu_cmd;
  1001. mutex_unlock(&udev->cmdr_lock);
  1002. return scsi_ret;
  1003. }
  1004. static void tcmu_set_next_deadline(struct list_head *queue,
  1005. struct timer_list *timer)
  1006. {
  1007. struct tcmu_cmd *cmd;
  1008. if (!list_empty(queue)) {
  1009. cmd = list_first_entry(queue, struct tcmu_cmd, queue_entry);
  1010. mod_timer(timer, cmd->deadline);
  1011. } else
  1012. del_timer(timer);
  1013. }
  1014. static int
  1015. tcmu_tmr_type(enum tcm_tmreq_table tmf)
  1016. {
  1017. switch (tmf) {
  1018. case TMR_ABORT_TASK: return TCMU_TMR_ABORT_TASK;
  1019. case TMR_ABORT_TASK_SET: return TCMU_TMR_ABORT_TASK_SET;
  1020. case TMR_CLEAR_ACA: return TCMU_TMR_CLEAR_ACA;
  1021. case TMR_CLEAR_TASK_SET: return TCMU_TMR_CLEAR_TASK_SET;
  1022. case TMR_LUN_RESET: return TCMU_TMR_LUN_RESET;
  1023. case TMR_TARGET_WARM_RESET: return TCMU_TMR_TARGET_WARM_RESET;
  1024. case TMR_TARGET_COLD_RESET: return TCMU_TMR_TARGET_COLD_RESET;
  1025. case TMR_LUN_RESET_PRO: return TCMU_TMR_LUN_RESET_PRO;
  1026. default: return TCMU_TMR_UNKNOWN;
  1027. }
  1028. }
  1029. static void
  1030. tcmu_tmr_notify(struct se_device *se_dev, enum tcm_tmreq_table tmf,
  1031. struct list_head *cmd_list)
  1032. {
  1033. int i = 0, cmd_cnt = 0;
  1034. bool unqueued = false;
  1035. struct tcmu_cmd *cmd;
  1036. struct se_cmd *se_cmd;
  1037. struct tcmu_tmr *tmr;
  1038. struct tcmu_dev *udev = TCMU_DEV(se_dev);
  1039. mutex_lock(&udev->cmdr_lock);
  1040. /* First we check for aborted commands in qfull_queue */
  1041. list_for_each_entry(se_cmd, cmd_list, state_list) {
  1042. i++;
  1043. if (!se_cmd->priv)
  1044. continue;
  1045. cmd = se_cmd->priv;
  1046. /* Commands on qfull queue have no id yet */
  1047. if (cmd->cmd_id) {
  1048. cmd_cnt++;
  1049. continue;
  1050. }
  1051. pr_debug("Removing aborted command %p from queue on dev %s.\n",
  1052. cmd, udev->name);
  1053. list_del_init(&cmd->queue_entry);
  1054. tcmu_free_cmd(cmd);
  1055. se_cmd->priv = NULL;
  1056. target_complete_cmd(se_cmd, SAM_STAT_TASK_ABORTED);
  1057. unqueued = true;
  1058. }
  1059. if (unqueued)
  1060. tcmu_set_next_deadline(&udev->qfull_queue, &udev->qfull_timer);
  1061. if (!test_bit(TCMU_DEV_BIT_TMR_NOTIFY, &udev->flags))
  1062. goto unlock;
  1063. pr_debug("TMR event %d on dev %s, aborted cmds %d, afflicted cmd_ids %d\n",
  1064. tcmu_tmr_type(tmf), udev->name, i, cmd_cnt);
  1065. tmr = kmalloc(struct_size(tmr, tmr_cmd_ids, cmd_cnt), GFP_NOIO);
  1066. if (!tmr)
  1067. goto unlock;
  1068. tmr->tmr_type = tcmu_tmr_type(tmf);
  1069. tmr->tmr_cmd_cnt = cmd_cnt;
  1070. if (cmd_cnt != 0) {
  1071. cmd_cnt = 0;
  1072. list_for_each_entry(se_cmd, cmd_list, state_list) {
  1073. if (!se_cmd->priv)
  1074. continue;
  1075. cmd = se_cmd->priv;
  1076. if (cmd->cmd_id)
  1077. tmr->tmr_cmd_ids[cmd_cnt++] = cmd->cmd_id;
  1078. }
  1079. }
  1080. queue_tmr_ring(udev, tmr);
  1081. unlock:
  1082. mutex_unlock(&udev->cmdr_lock);
  1083. }
  1084. static bool tcmu_handle_completion(struct tcmu_cmd *cmd,
  1085. struct tcmu_cmd_entry *entry, bool keep_buf)
  1086. {
  1087. struct se_cmd *se_cmd = cmd->se_cmd;
  1088. struct tcmu_dev *udev = cmd->tcmu_dev;
  1089. bool read_len_valid = false;
  1090. bool ret = true;
  1091. uint32_t read_len;
  1092. /*
  1093. * cmd has been completed already from timeout, just reclaim
  1094. * data area space and free cmd
  1095. */
  1096. if (test_bit(TCMU_CMD_BIT_EXPIRED, &cmd->flags)) {
  1097. WARN_ON_ONCE(se_cmd);
  1098. goto out;
  1099. }
  1100. if (test_bit(TCMU_CMD_BIT_KEEP_BUF, &cmd->flags)) {
  1101. pr_err("cmd_id %u already completed with KEEP_BUF, ring is broken\n",
  1102. entry->hdr.cmd_id);
  1103. set_bit(TCMU_DEV_BIT_BROKEN, &udev->flags);
  1104. ret = false;
  1105. goto out;
  1106. }
  1107. list_del_init(&cmd->queue_entry);
  1108. tcmu_cmd_reset_dbi_cur(cmd);
  1109. if (entry->hdr.uflags & TCMU_UFLAG_UNKNOWN_OP) {
  1110. pr_warn("TCMU: Userspace set UNKNOWN_OP flag on se_cmd %p\n",
  1111. cmd->se_cmd);
  1112. entry->rsp.scsi_status = SAM_STAT_CHECK_CONDITION;
  1113. goto done;
  1114. }
  1115. read_len = se_cmd->data_length;
  1116. if (se_cmd->data_direction == DMA_FROM_DEVICE &&
  1117. (entry->hdr.uflags & TCMU_UFLAG_READ_LEN) && entry->rsp.read_len) {
  1118. read_len_valid = true;
  1119. if (entry->rsp.read_len < read_len)
  1120. read_len = entry->rsp.read_len;
  1121. }
  1122. if (entry->rsp.scsi_status == SAM_STAT_CHECK_CONDITION) {
  1123. transport_copy_sense_to_cmd(se_cmd, entry->rsp.sense_buffer);
  1124. if (!read_len_valid )
  1125. goto done;
  1126. else
  1127. se_cmd->se_cmd_flags |= SCF_TREAT_READ_AS_NORMAL;
  1128. }
  1129. if (se_cmd->se_cmd_flags & SCF_BIDI) {
  1130. /* Get Data-In buffer before clean up */
  1131. gather_data_area(udev, cmd, true, read_len);
  1132. } else if (se_cmd->data_direction == DMA_FROM_DEVICE) {
  1133. gather_data_area(udev, cmd, false, read_len);
  1134. } else if (se_cmd->data_direction == DMA_TO_DEVICE) {
  1135. /* TODO: */
  1136. } else if (se_cmd->data_direction != DMA_NONE) {
  1137. pr_warn("TCMU: data direction was %d!\n",
  1138. se_cmd->data_direction);
  1139. }
  1140. done:
  1141. se_cmd->priv = NULL;
  1142. if (read_len_valid) {
  1143. pr_debug("read_len = %d\n", read_len);
  1144. target_complete_cmd_with_length(cmd->se_cmd,
  1145. entry->rsp.scsi_status, read_len);
  1146. } else
  1147. target_complete_cmd(cmd->se_cmd, entry->rsp.scsi_status);
  1148. out:
  1149. if (!keep_buf) {
  1150. tcmu_cmd_free_data(cmd, cmd->dbi_cnt);
  1151. tcmu_free_cmd(cmd);
  1152. } else {
  1153. /*
  1154. * Keep this command after completion, since userspace still
  1155. * needs the data buffer. Mark it with TCMU_CMD_BIT_KEEP_BUF
  1156. * and reset potential TCMU_CMD_BIT_EXPIRED, so we don't accept
  1157. * a second completion later.
  1158. * Userspace can free the buffer later by writing the cmd_id
  1159. * to new action attribute free_kept_buf.
  1160. */
  1161. clear_bit(TCMU_CMD_BIT_EXPIRED, &cmd->flags);
  1162. set_bit(TCMU_CMD_BIT_KEEP_BUF, &cmd->flags);
  1163. }
  1164. return ret;
  1165. }
  1166. static int tcmu_run_tmr_queue(struct tcmu_dev *udev)
  1167. {
  1168. struct tcmu_tmr *tmr, *tmp;
  1169. LIST_HEAD(tmrs);
  1170. if (list_empty(&udev->tmr_queue))
  1171. return 1;
  1172. pr_debug("running %s's tmr queue\n", udev->name);
  1173. list_splice_init(&udev->tmr_queue, &tmrs);
  1174. list_for_each_entry_safe(tmr, tmp, &tmrs, queue_entry) {
  1175. list_del_init(&tmr->queue_entry);
  1176. pr_debug("removing tmr %p on dev %s from queue\n",
  1177. tmr, udev->name);
  1178. if (queue_tmr_ring(udev, tmr)) {
  1179. pr_debug("ran out of space during tmr queue run\n");
  1180. /*
  1181. * tmr was requeued, so just put all tmrs back in
  1182. * the queue
  1183. */
  1184. list_splice_tail(&tmrs, &udev->tmr_queue);
  1185. return 0;
  1186. }
  1187. }
  1188. return 1;
  1189. }
  1190. static bool tcmu_handle_completions(struct tcmu_dev *udev)
  1191. {
  1192. struct tcmu_mailbox *mb;
  1193. struct tcmu_cmd *cmd;
  1194. bool free_space = false;
  1195. if (test_bit(TCMU_DEV_BIT_BROKEN, &udev->flags)) {
  1196. pr_err("ring broken, not handling completions\n");
  1197. return false;
  1198. }
  1199. mb = udev->mb_addr;
  1200. tcmu_flush_dcache_range(mb, sizeof(*mb));
  1201. while (udev->cmdr_last_cleaned != READ_ONCE(mb->cmd_tail)) {
  1202. struct tcmu_cmd_entry *entry = udev->cmdr + udev->cmdr_last_cleaned;
  1203. bool keep_buf;
  1204. /*
  1205. * Flush max. up to end of cmd ring since current entry might
  1206. * be a padding that is shorter than sizeof(*entry)
  1207. */
  1208. size_t ring_left = head_to_end(udev->cmdr_last_cleaned,
  1209. udev->cmdr_size);
  1210. tcmu_flush_dcache_range(entry, ring_left < sizeof(*entry) ?
  1211. ring_left : sizeof(*entry));
  1212. free_space = true;
  1213. if (tcmu_hdr_get_op(entry->hdr.len_op) == TCMU_OP_PAD ||
  1214. tcmu_hdr_get_op(entry->hdr.len_op) == TCMU_OP_TMR) {
  1215. UPDATE_HEAD(udev->cmdr_last_cleaned,
  1216. tcmu_hdr_get_len(entry->hdr.len_op),
  1217. udev->cmdr_size);
  1218. continue;
  1219. }
  1220. WARN_ON(tcmu_hdr_get_op(entry->hdr.len_op) != TCMU_OP_CMD);
  1221. keep_buf = !!(entry->hdr.uflags & TCMU_UFLAG_KEEP_BUF);
  1222. if (keep_buf)
  1223. cmd = xa_load(&udev->commands, entry->hdr.cmd_id);
  1224. else
  1225. cmd = xa_erase(&udev->commands, entry->hdr.cmd_id);
  1226. if (!cmd) {
  1227. pr_err("cmd_id %u not found, ring is broken\n",
  1228. entry->hdr.cmd_id);
  1229. set_bit(TCMU_DEV_BIT_BROKEN, &udev->flags);
  1230. return false;
  1231. }
  1232. if (!tcmu_handle_completion(cmd, entry, keep_buf))
  1233. break;
  1234. UPDATE_HEAD(udev->cmdr_last_cleaned,
  1235. tcmu_hdr_get_len(entry->hdr.len_op),
  1236. udev->cmdr_size);
  1237. }
  1238. if (free_space)
  1239. free_space = tcmu_run_tmr_queue(udev);
  1240. if (atomic_read(&global_page_count) > tcmu_global_max_pages &&
  1241. xa_empty(&udev->commands) && list_empty(&udev->qfull_queue)) {
  1242. /*
  1243. * Allocated blocks exceeded global block limit, currently no
  1244. * more pending or waiting commands so try to reclaim blocks.
  1245. */
  1246. schedule_delayed_work(&tcmu_unmap_work, 0);
  1247. }
  1248. if (udev->cmd_time_out)
  1249. tcmu_set_next_deadline(&udev->inflight_queue, &udev->cmd_timer);
  1250. return free_space;
  1251. }
  1252. static void tcmu_check_expired_ring_cmd(struct tcmu_cmd *cmd)
  1253. {
  1254. struct se_cmd *se_cmd;
  1255. if (!time_after_eq(jiffies, cmd->deadline))
  1256. return;
  1257. set_bit(TCMU_CMD_BIT_EXPIRED, &cmd->flags);
  1258. list_del_init(&cmd->queue_entry);
  1259. se_cmd = cmd->se_cmd;
  1260. se_cmd->priv = NULL;
  1261. cmd->se_cmd = NULL;
  1262. pr_debug("Timing out inflight cmd %u on dev %s.\n",
  1263. cmd->cmd_id, cmd->tcmu_dev->name);
  1264. target_complete_cmd(se_cmd, SAM_STAT_CHECK_CONDITION);
  1265. }
  1266. static void tcmu_check_expired_queue_cmd(struct tcmu_cmd *cmd)
  1267. {
  1268. struct se_cmd *se_cmd;
  1269. if (!time_after_eq(jiffies, cmd->deadline))
  1270. return;
  1271. pr_debug("Timing out queued cmd %p on dev %s.\n",
  1272. cmd, cmd->tcmu_dev->name);
  1273. list_del_init(&cmd->queue_entry);
  1274. se_cmd = cmd->se_cmd;
  1275. tcmu_free_cmd(cmd);
  1276. se_cmd->priv = NULL;
  1277. target_complete_cmd(se_cmd, SAM_STAT_TASK_SET_FULL);
  1278. }
  1279. static void tcmu_device_timedout(struct tcmu_dev *udev)
  1280. {
  1281. spin_lock(&timed_out_udevs_lock);
  1282. if (list_empty(&udev->timedout_entry))
  1283. list_add_tail(&udev->timedout_entry, &timed_out_udevs);
  1284. spin_unlock(&timed_out_udevs_lock);
  1285. schedule_delayed_work(&tcmu_unmap_work, 0);
  1286. }
  1287. static void tcmu_cmd_timedout(struct timer_list *t)
  1288. {
  1289. struct tcmu_dev *udev = from_timer(udev, t, cmd_timer);
  1290. pr_debug("%s cmd timeout has expired\n", udev->name);
  1291. tcmu_device_timedout(udev);
  1292. }
  1293. static void tcmu_qfull_timedout(struct timer_list *t)
  1294. {
  1295. struct tcmu_dev *udev = from_timer(udev, t, qfull_timer);
  1296. pr_debug("%s qfull timeout has expired\n", udev->name);
  1297. tcmu_device_timedout(udev);
  1298. }
  1299. static int tcmu_attach_hba(struct se_hba *hba, u32 host_id)
  1300. {
  1301. struct tcmu_hba *tcmu_hba;
  1302. tcmu_hba = kzalloc(sizeof(struct tcmu_hba), GFP_KERNEL);
  1303. if (!tcmu_hba)
  1304. return -ENOMEM;
  1305. tcmu_hba->host_id = host_id;
  1306. hba->hba_ptr = tcmu_hba;
  1307. return 0;
  1308. }
  1309. static void tcmu_detach_hba(struct se_hba *hba)
  1310. {
  1311. kfree(hba->hba_ptr);
  1312. hba->hba_ptr = NULL;
  1313. }
  1314. static struct se_device *tcmu_alloc_device(struct se_hba *hba, const char *name)
  1315. {
  1316. struct tcmu_dev *udev;
  1317. udev = kzalloc(sizeof(struct tcmu_dev), GFP_KERNEL);
  1318. if (!udev)
  1319. return NULL;
  1320. kref_init(&udev->kref);
  1321. udev->name = kstrdup(name, GFP_KERNEL);
  1322. if (!udev->name) {
  1323. kfree(udev);
  1324. return NULL;
  1325. }
  1326. udev->hba = hba;
  1327. udev->cmd_time_out = TCMU_TIME_OUT;
  1328. udev->qfull_time_out = -1;
  1329. udev->data_pages_per_blk = DATA_PAGES_PER_BLK_DEF;
  1330. udev->max_blocks = DATA_AREA_PAGES_DEF / udev->data_pages_per_blk;
  1331. udev->cmdr_size = CMDR_SIZE_DEF;
  1332. udev->data_area_mb = TCMU_PAGES_TO_MBS(DATA_AREA_PAGES_DEF);
  1333. mutex_init(&udev->cmdr_lock);
  1334. INIT_LIST_HEAD(&udev->node);
  1335. INIT_LIST_HEAD(&udev->timedout_entry);
  1336. INIT_LIST_HEAD(&udev->qfull_queue);
  1337. INIT_LIST_HEAD(&udev->tmr_queue);
  1338. INIT_LIST_HEAD(&udev->inflight_queue);
  1339. xa_init_flags(&udev->commands, XA_FLAGS_ALLOC1);
  1340. timer_setup(&udev->qfull_timer, tcmu_qfull_timedout, 0);
  1341. timer_setup(&udev->cmd_timer, tcmu_cmd_timedout, 0);
  1342. xa_init(&udev->data_pages);
  1343. return &udev->se_dev;
  1344. }
  1345. static void tcmu_dev_call_rcu(struct rcu_head *p)
  1346. {
  1347. struct se_device *dev = container_of(p, struct se_device, rcu_head);
  1348. struct tcmu_dev *udev = TCMU_DEV(dev);
  1349. kfree(udev->uio_info.name);
  1350. kfree(udev->name);
  1351. kfree(udev);
  1352. }
  1353. static int tcmu_check_and_free_pending_cmd(struct tcmu_cmd *cmd)
  1354. {
  1355. if (test_bit(TCMU_CMD_BIT_EXPIRED, &cmd->flags) ||
  1356. test_bit(TCMU_CMD_BIT_KEEP_BUF, &cmd->flags)) {
  1357. kmem_cache_free(tcmu_cmd_cache, cmd);
  1358. return 0;
  1359. }
  1360. return -EINVAL;
  1361. }
  1362. static u32 tcmu_blocks_release(struct tcmu_dev *udev, unsigned long first,
  1363. unsigned long last)
  1364. {
  1365. struct page *page;
  1366. unsigned long dpi;
  1367. u32 pages_freed = 0;
  1368. first = first * udev->data_pages_per_blk;
  1369. last = (last + 1) * udev->data_pages_per_blk - 1;
  1370. xa_for_each_range(&udev->data_pages, dpi, page, first, last) {
  1371. xa_erase(&udev->data_pages, dpi);
  1372. /*
  1373. * While reaching here there may be page faults occurring on
  1374. * the to-be-released pages. A race condition may occur if
  1375. * unmap_mapping_range() is called before page faults on these
  1376. * pages have completed; a valid but stale map is created.
  1377. *
  1378. * If another command subsequently runs and needs to extend
  1379. * dbi_thresh, it may reuse the slot corresponding to the
  1380. * previous page in data_bitmap. Though we will allocate a new
  1381. * page for the slot in data_area, no page fault will happen
  1382. * because we have a valid map. Therefore the command's data
  1383. * will be lost.
  1384. *
  1385. * We lock and unlock pages that are to be released to ensure
  1386. * all page faults have completed. This way
  1387. * unmap_mapping_range() can ensure stale maps are cleanly
  1388. * removed.
  1389. */
  1390. lock_page(page);
  1391. unlock_page(page);
  1392. __free_page(page);
  1393. pages_freed++;
  1394. }
  1395. atomic_sub(pages_freed, &global_page_count);
  1396. return pages_freed;
  1397. }
  1398. static void tcmu_remove_all_queued_tmr(struct tcmu_dev *udev)
  1399. {
  1400. struct tcmu_tmr *tmr, *tmp;
  1401. list_for_each_entry_safe(tmr, tmp, &udev->tmr_queue, queue_entry) {
  1402. list_del_init(&tmr->queue_entry);
  1403. kfree(tmr);
  1404. }
  1405. }
  1406. static void tcmu_dev_kref_release(struct kref *kref)
  1407. {
  1408. struct tcmu_dev *udev = container_of(kref, struct tcmu_dev, kref);
  1409. struct se_device *dev = &udev->se_dev;
  1410. struct tcmu_cmd *cmd;
  1411. bool all_expired = true;
  1412. unsigned long i;
  1413. vfree(udev->mb_addr);
  1414. udev->mb_addr = NULL;
  1415. spin_lock_bh(&timed_out_udevs_lock);
  1416. if (!list_empty(&udev->timedout_entry))
  1417. list_del(&udev->timedout_entry);
  1418. spin_unlock_bh(&timed_out_udevs_lock);
  1419. /* Upper layer should drain all requests before calling this */
  1420. mutex_lock(&udev->cmdr_lock);
  1421. xa_for_each(&udev->commands, i, cmd) {
  1422. if (tcmu_check_and_free_pending_cmd(cmd) != 0)
  1423. all_expired = false;
  1424. }
  1425. /* There can be left over TMR cmds. Remove them. */
  1426. tcmu_remove_all_queued_tmr(udev);
  1427. if (!list_empty(&udev->qfull_queue))
  1428. all_expired = false;
  1429. xa_destroy(&udev->commands);
  1430. WARN_ON(!all_expired);
  1431. tcmu_blocks_release(udev, 0, udev->dbi_max);
  1432. bitmap_free(udev->data_bitmap);
  1433. mutex_unlock(&udev->cmdr_lock);
  1434. pr_debug("dev_kref_release\n");
  1435. call_rcu(&dev->rcu_head, tcmu_dev_call_rcu);
  1436. }
  1437. static void run_qfull_queue(struct tcmu_dev *udev, bool fail)
  1438. {
  1439. struct tcmu_cmd *tcmu_cmd, *tmp_cmd;
  1440. LIST_HEAD(cmds);
  1441. sense_reason_t scsi_ret;
  1442. int ret;
  1443. if (list_empty(&udev->qfull_queue))
  1444. return;
  1445. pr_debug("running %s's cmdr queue forcefail %d\n", udev->name, fail);
  1446. list_splice_init(&udev->qfull_queue, &cmds);
  1447. list_for_each_entry_safe(tcmu_cmd, tmp_cmd, &cmds, queue_entry) {
  1448. list_del_init(&tcmu_cmd->queue_entry);
  1449. pr_debug("removing cmd %p on dev %s from queue\n",
  1450. tcmu_cmd, udev->name);
  1451. if (fail) {
  1452. /*
  1453. * We were not able to even start the command, so
  1454. * fail with busy to allow a retry in case runner
  1455. * was only temporarily down. If the device is being
  1456. * removed then LIO core will do the right thing and
  1457. * fail the retry.
  1458. */
  1459. tcmu_cmd->se_cmd->priv = NULL;
  1460. target_complete_cmd(tcmu_cmd->se_cmd, SAM_STAT_BUSY);
  1461. tcmu_free_cmd(tcmu_cmd);
  1462. continue;
  1463. }
  1464. ret = queue_cmd_ring(tcmu_cmd, &scsi_ret);
  1465. if (ret < 0) {
  1466. pr_debug("cmd %p on dev %s failed with %u\n",
  1467. tcmu_cmd, udev->name, scsi_ret);
  1468. /*
  1469. * Ignore scsi_ret for now. target_complete_cmd
  1470. * drops it.
  1471. */
  1472. tcmu_cmd->se_cmd->priv = NULL;
  1473. target_complete_cmd(tcmu_cmd->se_cmd,
  1474. SAM_STAT_CHECK_CONDITION);
  1475. tcmu_free_cmd(tcmu_cmd);
  1476. } else if (ret > 0) {
  1477. pr_debug("ran out of space during cmdr queue run\n");
  1478. /*
  1479. * cmd was requeued, so just put all cmds back in
  1480. * the queue
  1481. */
  1482. list_splice_tail(&cmds, &udev->qfull_queue);
  1483. break;
  1484. }
  1485. }
  1486. tcmu_set_next_deadline(&udev->qfull_queue, &udev->qfull_timer);
  1487. }
  1488. static int tcmu_irqcontrol(struct uio_info *info, s32 irq_on)
  1489. {
  1490. struct tcmu_dev *udev = container_of(info, struct tcmu_dev, uio_info);
  1491. mutex_lock(&udev->cmdr_lock);
  1492. if (tcmu_handle_completions(udev))
  1493. run_qfull_queue(udev, false);
  1494. mutex_unlock(&udev->cmdr_lock);
  1495. return 0;
  1496. }
  1497. /*
  1498. * mmap code from uio.c. Copied here because we want to hook mmap()
  1499. * and this stuff must come along.
  1500. */
  1501. static int tcmu_find_mem_index(struct vm_area_struct *vma)
  1502. {
  1503. struct tcmu_dev *udev = vma->vm_private_data;
  1504. struct uio_info *info = &udev->uio_info;
  1505. if (vma->vm_pgoff < MAX_UIO_MAPS) {
  1506. if (info->mem[vma->vm_pgoff].size == 0)
  1507. return -1;
  1508. return (int)vma->vm_pgoff;
  1509. }
  1510. return -1;
  1511. }
  1512. static struct page *tcmu_try_get_data_page(struct tcmu_dev *udev, uint32_t dpi)
  1513. {
  1514. struct page *page;
  1515. mutex_lock(&udev->cmdr_lock);
  1516. page = xa_load(&udev->data_pages, dpi);
  1517. if (likely(page)) {
  1518. get_page(page);
  1519. lock_page(page);
  1520. mutex_unlock(&udev->cmdr_lock);
  1521. return page;
  1522. }
  1523. /*
  1524. * Userspace messed up and passed in a address not in the
  1525. * data iov passed to it.
  1526. */
  1527. pr_err("Invalid addr to data page mapping (dpi %u) on device %s\n",
  1528. dpi, udev->name);
  1529. mutex_unlock(&udev->cmdr_lock);
  1530. return NULL;
  1531. }
  1532. static void tcmu_vma_open(struct vm_area_struct *vma)
  1533. {
  1534. struct tcmu_dev *udev = vma->vm_private_data;
  1535. pr_debug("vma_open\n");
  1536. kref_get(&udev->kref);
  1537. }
  1538. static void tcmu_vma_close(struct vm_area_struct *vma)
  1539. {
  1540. struct tcmu_dev *udev = vma->vm_private_data;
  1541. pr_debug("vma_close\n");
  1542. /* release ref from tcmu_vma_open */
  1543. kref_put(&udev->kref, tcmu_dev_kref_release);
  1544. }
  1545. static vm_fault_t tcmu_vma_fault(struct vm_fault *vmf)
  1546. {
  1547. struct tcmu_dev *udev = vmf->vma->vm_private_data;
  1548. struct uio_info *info = &udev->uio_info;
  1549. struct page *page;
  1550. unsigned long offset;
  1551. void *addr;
  1552. vm_fault_t ret = 0;
  1553. int mi = tcmu_find_mem_index(vmf->vma);
  1554. if (mi < 0)
  1555. return VM_FAULT_SIGBUS;
  1556. /*
  1557. * We need to subtract mi because userspace uses offset = N*PAGE_SIZE
  1558. * to use mem[N].
  1559. */
  1560. offset = (vmf->pgoff - mi) << PAGE_SHIFT;
  1561. if (offset < udev->data_off) {
  1562. /* For the vmalloc()ed cmd area pages */
  1563. addr = (void *)(unsigned long)info->mem[mi].addr + offset;
  1564. page = vmalloc_to_page(addr);
  1565. get_page(page);
  1566. } else {
  1567. uint32_t dpi;
  1568. /* For the dynamically growing data area pages */
  1569. dpi = (offset - udev->data_off) / PAGE_SIZE;
  1570. page = tcmu_try_get_data_page(udev, dpi);
  1571. if (!page)
  1572. return VM_FAULT_SIGBUS;
  1573. ret = VM_FAULT_LOCKED;
  1574. }
  1575. vmf->page = page;
  1576. return ret;
  1577. }
  1578. static const struct vm_operations_struct tcmu_vm_ops = {
  1579. .open = tcmu_vma_open,
  1580. .close = tcmu_vma_close,
  1581. .fault = tcmu_vma_fault,
  1582. };
  1583. static int tcmu_mmap(struct uio_info *info, struct vm_area_struct *vma)
  1584. {
  1585. struct tcmu_dev *udev = container_of(info, struct tcmu_dev, uio_info);
  1586. vm_flags_set(vma, VM_DONTEXPAND | VM_DONTDUMP);
  1587. vma->vm_ops = &tcmu_vm_ops;
  1588. vma->vm_private_data = udev;
  1589. /* Ensure the mmap is exactly the right size */
  1590. if (vma_pages(vma) != udev->mmap_pages)
  1591. return -EINVAL;
  1592. tcmu_vma_open(vma);
  1593. return 0;
  1594. }
  1595. static int tcmu_open(struct uio_info *info, struct inode *inode)
  1596. {
  1597. struct tcmu_dev *udev = container_of(info, struct tcmu_dev, uio_info);
  1598. /* O_EXCL not supported for char devs, so fake it? */
  1599. if (test_and_set_bit(TCMU_DEV_BIT_OPEN, &udev->flags))
  1600. return -EBUSY;
  1601. udev->inode = inode;
  1602. pr_debug("open\n");
  1603. return 0;
  1604. }
  1605. static int tcmu_release(struct uio_info *info, struct inode *inode)
  1606. {
  1607. struct tcmu_dev *udev = container_of(info, struct tcmu_dev, uio_info);
  1608. struct tcmu_cmd *cmd;
  1609. unsigned long i;
  1610. bool freed = false;
  1611. mutex_lock(&udev->cmdr_lock);
  1612. xa_for_each(&udev->commands, i, cmd) {
  1613. /* Cmds with KEEP_BUF set are no longer on the ring, but
  1614. * userspace still holds the data buffer. If userspace closes
  1615. * we implicitly free these cmds and buffers, since after new
  1616. * open the (new ?) userspace cannot find the cmd in the ring
  1617. * and thus never will release the buffer by writing cmd_id to
  1618. * free_kept_buf action attribute.
  1619. */
  1620. if (!test_bit(TCMU_CMD_BIT_KEEP_BUF, &cmd->flags))
  1621. continue;
  1622. pr_debug("removing KEEP_BUF cmd %u on dev %s from ring\n",
  1623. cmd->cmd_id, udev->name);
  1624. freed = true;
  1625. xa_erase(&udev->commands, i);
  1626. tcmu_cmd_free_data(cmd, cmd->dbi_cnt);
  1627. tcmu_free_cmd(cmd);
  1628. }
  1629. /*
  1630. * We only freed data space, not ring space. Therefore we dont call
  1631. * run_tmr_queue, but call run_qfull_queue if tmr_list is empty.
  1632. */
  1633. if (freed && list_empty(&udev->tmr_queue))
  1634. run_qfull_queue(udev, false);
  1635. mutex_unlock(&udev->cmdr_lock);
  1636. clear_bit(TCMU_DEV_BIT_OPEN, &udev->flags);
  1637. pr_debug("close\n");
  1638. return 0;
  1639. }
  1640. static int tcmu_init_genl_cmd_reply(struct tcmu_dev *udev, int cmd)
  1641. {
  1642. struct tcmu_nl_cmd *nl_cmd = &udev->curr_nl_cmd;
  1643. if (!tcmu_kern_cmd_reply_supported)
  1644. return 0;
  1645. if (udev->nl_reply_supported <= 0)
  1646. return 0;
  1647. mutex_lock(&tcmu_nl_cmd_mutex);
  1648. if (tcmu_netlink_blocked) {
  1649. mutex_unlock(&tcmu_nl_cmd_mutex);
  1650. pr_warn("Failing nl cmd %d on %s. Interface is blocked.\n", cmd,
  1651. udev->name);
  1652. return -EAGAIN;
  1653. }
  1654. if (nl_cmd->cmd != TCMU_CMD_UNSPEC) {
  1655. mutex_unlock(&tcmu_nl_cmd_mutex);
  1656. pr_warn("netlink cmd %d already executing on %s\n",
  1657. nl_cmd->cmd, udev->name);
  1658. return -EBUSY;
  1659. }
  1660. memset(nl_cmd, 0, sizeof(*nl_cmd));
  1661. nl_cmd->cmd = cmd;
  1662. nl_cmd->udev = udev;
  1663. init_completion(&nl_cmd->complete);
  1664. INIT_LIST_HEAD(&nl_cmd->nl_list);
  1665. list_add_tail(&nl_cmd->nl_list, &tcmu_nl_cmd_list);
  1666. mutex_unlock(&tcmu_nl_cmd_mutex);
  1667. return 0;
  1668. }
  1669. static void tcmu_destroy_genl_cmd_reply(struct tcmu_dev *udev)
  1670. {
  1671. struct tcmu_nl_cmd *nl_cmd = &udev->curr_nl_cmd;
  1672. if (!tcmu_kern_cmd_reply_supported)
  1673. return;
  1674. if (udev->nl_reply_supported <= 0)
  1675. return;
  1676. mutex_lock(&tcmu_nl_cmd_mutex);
  1677. list_del(&nl_cmd->nl_list);
  1678. memset(nl_cmd, 0, sizeof(*nl_cmd));
  1679. mutex_unlock(&tcmu_nl_cmd_mutex);
  1680. }
  1681. static int tcmu_wait_genl_cmd_reply(struct tcmu_dev *udev)
  1682. {
  1683. struct tcmu_nl_cmd *nl_cmd = &udev->curr_nl_cmd;
  1684. int ret;
  1685. if (!tcmu_kern_cmd_reply_supported)
  1686. return 0;
  1687. if (udev->nl_reply_supported <= 0)
  1688. return 0;
  1689. pr_debug("sleeping for nl reply\n");
  1690. wait_for_completion(&nl_cmd->complete);
  1691. mutex_lock(&tcmu_nl_cmd_mutex);
  1692. nl_cmd->cmd = TCMU_CMD_UNSPEC;
  1693. ret = nl_cmd->status;
  1694. mutex_unlock(&tcmu_nl_cmd_mutex);
  1695. return ret;
  1696. }
  1697. static int tcmu_netlink_event_init(struct tcmu_dev *udev,
  1698. enum tcmu_genl_cmd cmd,
  1699. struct sk_buff **buf, void **hdr)
  1700. {
  1701. struct sk_buff *skb;
  1702. void *msg_header;
  1703. int ret = -ENOMEM;
  1704. skb = genlmsg_new(NLMSG_GOODSIZE, GFP_KERNEL);
  1705. if (!skb)
  1706. return ret;
  1707. msg_header = genlmsg_put(skb, 0, 0, &tcmu_genl_family, 0, cmd);
  1708. if (!msg_header)
  1709. goto free_skb;
  1710. ret = nla_put_string(skb, TCMU_ATTR_DEVICE, udev->uio_info.name);
  1711. if (ret < 0)
  1712. goto free_skb;
  1713. ret = nla_put_u32(skb, TCMU_ATTR_MINOR, udev->uio_info.uio_dev->minor);
  1714. if (ret < 0)
  1715. goto free_skb;
  1716. ret = nla_put_u32(skb, TCMU_ATTR_DEVICE_ID, udev->se_dev.dev_index);
  1717. if (ret < 0)
  1718. goto free_skb;
  1719. *buf = skb;
  1720. *hdr = msg_header;
  1721. return ret;
  1722. free_skb:
  1723. nlmsg_free(skb);
  1724. return ret;
  1725. }
  1726. static int tcmu_netlink_event_send(struct tcmu_dev *udev,
  1727. enum tcmu_genl_cmd cmd,
  1728. struct sk_buff *skb, void *msg_header)
  1729. {
  1730. int ret;
  1731. genlmsg_end(skb, msg_header);
  1732. ret = tcmu_init_genl_cmd_reply(udev, cmd);
  1733. if (ret) {
  1734. nlmsg_free(skb);
  1735. return ret;
  1736. }
  1737. ret = genlmsg_multicast_allns(&tcmu_genl_family, skb, 0,
  1738. TCMU_MCGRP_CONFIG);
  1739. /* Wait during an add as the listener may not be up yet */
  1740. if (ret == 0 ||
  1741. (ret == -ESRCH && cmd == TCMU_CMD_ADDED_DEVICE))
  1742. return tcmu_wait_genl_cmd_reply(udev);
  1743. else
  1744. tcmu_destroy_genl_cmd_reply(udev);
  1745. return ret;
  1746. }
  1747. static int tcmu_send_dev_add_event(struct tcmu_dev *udev)
  1748. {
  1749. struct sk_buff *skb = NULL;
  1750. void *msg_header = NULL;
  1751. int ret = 0;
  1752. ret = tcmu_netlink_event_init(udev, TCMU_CMD_ADDED_DEVICE, &skb,
  1753. &msg_header);
  1754. if (ret < 0)
  1755. return ret;
  1756. return tcmu_netlink_event_send(udev, TCMU_CMD_ADDED_DEVICE, skb,
  1757. msg_header);
  1758. }
  1759. static int tcmu_send_dev_remove_event(struct tcmu_dev *udev)
  1760. {
  1761. struct sk_buff *skb = NULL;
  1762. void *msg_header = NULL;
  1763. int ret = 0;
  1764. ret = tcmu_netlink_event_init(udev, TCMU_CMD_REMOVED_DEVICE,
  1765. &skb, &msg_header);
  1766. if (ret < 0)
  1767. return ret;
  1768. return tcmu_netlink_event_send(udev, TCMU_CMD_REMOVED_DEVICE,
  1769. skb, msg_header);
  1770. }
  1771. static int tcmu_update_uio_info(struct tcmu_dev *udev)
  1772. {
  1773. struct tcmu_hba *hba = udev->hba->hba_ptr;
  1774. struct uio_info *info;
  1775. char *str;
  1776. info = &udev->uio_info;
  1777. if (udev->dev_config[0])
  1778. str = kasprintf(GFP_KERNEL, "tcm-user/%u/%s/%s", hba->host_id,
  1779. udev->name, udev->dev_config);
  1780. else
  1781. str = kasprintf(GFP_KERNEL, "tcm-user/%u/%s", hba->host_id,
  1782. udev->name);
  1783. if (!str)
  1784. return -ENOMEM;
  1785. /* If the old string exists, free it */
  1786. kfree(info->name);
  1787. info->name = str;
  1788. return 0;
  1789. }
  1790. static int tcmu_configure_device(struct se_device *dev)
  1791. {
  1792. struct tcmu_dev *udev = TCMU_DEV(dev);
  1793. struct uio_info *info;
  1794. struct tcmu_mailbox *mb;
  1795. size_t data_size;
  1796. int ret = 0;
  1797. ret = tcmu_update_uio_info(udev);
  1798. if (ret)
  1799. return ret;
  1800. info = &udev->uio_info;
  1801. mutex_lock(&udev->cmdr_lock);
  1802. udev->data_bitmap = bitmap_zalloc(udev->max_blocks, GFP_KERNEL);
  1803. mutex_unlock(&udev->cmdr_lock);
  1804. if (!udev->data_bitmap) {
  1805. ret = -ENOMEM;
  1806. goto err_bitmap_alloc;
  1807. }
  1808. mb = vzalloc(udev->cmdr_size + CMDR_OFF);
  1809. if (!mb) {
  1810. ret = -ENOMEM;
  1811. goto err_vzalloc;
  1812. }
  1813. /* mailbox fits in first part of CMDR space */
  1814. udev->mb_addr = mb;
  1815. udev->cmdr = (void *)mb + CMDR_OFF;
  1816. udev->data_off = udev->cmdr_size + CMDR_OFF;
  1817. data_size = TCMU_MBS_TO_PAGES(udev->data_area_mb) << PAGE_SHIFT;
  1818. udev->mmap_pages = (data_size + udev->cmdr_size + CMDR_OFF) >> PAGE_SHIFT;
  1819. udev->data_blk_size = udev->data_pages_per_blk * PAGE_SIZE;
  1820. udev->dbi_thresh = 0; /* Default in Idle state */
  1821. /* Initialise the mailbox of the ring buffer */
  1822. mb->version = TCMU_MAILBOX_VERSION;
  1823. mb->flags = TCMU_MAILBOX_FLAG_CAP_OOOC |
  1824. TCMU_MAILBOX_FLAG_CAP_READ_LEN |
  1825. TCMU_MAILBOX_FLAG_CAP_TMR |
  1826. TCMU_MAILBOX_FLAG_CAP_KEEP_BUF;
  1827. mb->cmdr_off = CMDR_OFF;
  1828. mb->cmdr_size = udev->cmdr_size;
  1829. WARN_ON(!PAGE_ALIGNED(udev->data_off));
  1830. WARN_ON(data_size % PAGE_SIZE);
  1831. info->version = __stringify(TCMU_MAILBOX_VERSION);
  1832. info->mem[0].name = "tcm-user command & data buffer";
  1833. info->mem[0].addr = (phys_addr_t)(uintptr_t)udev->mb_addr;
  1834. info->mem[0].size = data_size + udev->cmdr_size + CMDR_OFF;
  1835. info->mem[0].memtype = UIO_MEM_NONE;
  1836. info->irqcontrol = tcmu_irqcontrol;
  1837. info->irq = UIO_IRQ_CUSTOM;
  1838. info->mmap = tcmu_mmap;
  1839. info->open = tcmu_open;
  1840. info->release = tcmu_release;
  1841. ret = uio_register_device(tcmu_root_device, info);
  1842. if (ret)
  1843. goto err_register;
  1844. /* User can set hw_block_size before enable the device */
  1845. if (dev->dev_attrib.hw_block_size == 0)
  1846. dev->dev_attrib.hw_block_size = 512;
  1847. /* Other attributes can be configured in userspace */
  1848. if (!dev->dev_attrib.hw_max_sectors)
  1849. dev->dev_attrib.hw_max_sectors = 128;
  1850. if (!dev->dev_attrib.emulate_write_cache)
  1851. dev->dev_attrib.emulate_write_cache = 0;
  1852. dev->dev_attrib.hw_queue_depth = 128;
  1853. /* If user didn't explicitly disable netlink reply support, use
  1854. * module scope setting.
  1855. */
  1856. if (udev->nl_reply_supported >= 0)
  1857. udev->nl_reply_supported = tcmu_kern_cmd_reply_supported;
  1858. /*
  1859. * Get a ref incase userspace does a close on the uio device before
  1860. * LIO has initiated tcmu_free_device.
  1861. */
  1862. kref_get(&udev->kref);
  1863. ret = tcmu_send_dev_add_event(udev);
  1864. if (ret)
  1865. goto err_netlink;
  1866. mutex_lock(&root_udev_mutex);
  1867. list_add(&udev->node, &root_udev);
  1868. mutex_unlock(&root_udev_mutex);
  1869. return 0;
  1870. err_netlink:
  1871. kref_put(&udev->kref, tcmu_dev_kref_release);
  1872. uio_unregister_device(&udev->uio_info);
  1873. err_register:
  1874. vfree(udev->mb_addr);
  1875. udev->mb_addr = NULL;
  1876. err_vzalloc:
  1877. bitmap_free(udev->data_bitmap);
  1878. udev->data_bitmap = NULL;
  1879. err_bitmap_alloc:
  1880. kfree(info->name);
  1881. info->name = NULL;
  1882. return ret;
  1883. }
  1884. static void tcmu_free_device(struct se_device *dev)
  1885. {
  1886. struct tcmu_dev *udev = TCMU_DEV(dev);
  1887. /* release ref from init */
  1888. kref_put(&udev->kref, tcmu_dev_kref_release);
  1889. }
  1890. static void tcmu_destroy_device(struct se_device *dev)
  1891. {
  1892. struct tcmu_dev *udev = TCMU_DEV(dev);
  1893. del_timer_sync(&udev->cmd_timer);
  1894. del_timer_sync(&udev->qfull_timer);
  1895. mutex_lock(&root_udev_mutex);
  1896. list_del(&udev->node);
  1897. mutex_unlock(&root_udev_mutex);
  1898. tcmu_send_dev_remove_event(udev);
  1899. uio_unregister_device(&udev->uio_info);
  1900. /* release ref from configure */
  1901. kref_put(&udev->kref, tcmu_dev_kref_release);
  1902. }
  1903. static void tcmu_unblock_dev(struct tcmu_dev *udev)
  1904. {
  1905. mutex_lock(&udev->cmdr_lock);
  1906. clear_bit(TCMU_DEV_BIT_BLOCKED, &udev->flags);
  1907. mutex_unlock(&udev->cmdr_lock);
  1908. }
  1909. static void tcmu_block_dev(struct tcmu_dev *udev)
  1910. {
  1911. mutex_lock(&udev->cmdr_lock);
  1912. if (test_and_set_bit(TCMU_DEV_BIT_BLOCKED, &udev->flags))
  1913. goto unlock;
  1914. /* complete IO that has executed successfully */
  1915. tcmu_handle_completions(udev);
  1916. /* fail IO waiting to be queued */
  1917. run_qfull_queue(udev, true);
  1918. unlock:
  1919. mutex_unlock(&udev->cmdr_lock);
  1920. }
  1921. static void tcmu_reset_ring(struct tcmu_dev *udev, u8 err_level)
  1922. {
  1923. struct tcmu_mailbox *mb;
  1924. struct tcmu_cmd *cmd;
  1925. unsigned long i;
  1926. mutex_lock(&udev->cmdr_lock);
  1927. xa_for_each(&udev->commands, i, cmd) {
  1928. pr_debug("removing cmd %u on dev %s from ring %s\n",
  1929. cmd->cmd_id, udev->name,
  1930. test_bit(TCMU_CMD_BIT_EXPIRED, &cmd->flags) ?
  1931. "(is expired)" :
  1932. (test_bit(TCMU_CMD_BIT_KEEP_BUF, &cmd->flags) ?
  1933. "(is keep buffer)" : ""));
  1934. xa_erase(&udev->commands, i);
  1935. if (!test_bit(TCMU_CMD_BIT_EXPIRED, &cmd->flags) &&
  1936. !test_bit(TCMU_CMD_BIT_KEEP_BUF, &cmd->flags)) {
  1937. WARN_ON(!cmd->se_cmd);
  1938. list_del_init(&cmd->queue_entry);
  1939. cmd->se_cmd->priv = NULL;
  1940. if (err_level == 1) {
  1941. /*
  1942. * Userspace was not able to start the
  1943. * command or it is retryable.
  1944. */
  1945. target_complete_cmd(cmd->se_cmd, SAM_STAT_BUSY);
  1946. } else {
  1947. /* hard failure */
  1948. target_complete_cmd(cmd->se_cmd,
  1949. SAM_STAT_CHECK_CONDITION);
  1950. }
  1951. }
  1952. tcmu_cmd_free_data(cmd, cmd->dbi_cnt);
  1953. tcmu_free_cmd(cmd);
  1954. }
  1955. mb = udev->mb_addr;
  1956. tcmu_flush_dcache_range(mb, sizeof(*mb));
  1957. pr_debug("mb last %u head %u tail %u\n", udev->cmdr_last_cleaned,
  1958. mb->cmd_tail, mb->cmd_head);
  1959. udev->cmdr_last_cleaned = 0;
  1960. mb->cmd_tail = 0;
  1961. mb->cmd_head = 0;
  1962. tcmu_flush_dcache_range(mb, sizeof(*mb));
  1963. clear_bit(TCMU_DEV_BIT_BROKEN, &udev->flags);
  1964. del_timer(&udev->cmd_timer);
  1965. /*
  1966. * ring is empty and qfull queue never contains aborted commands.
  1967. * So TMRs in tmr queue do not contain relevant cmd_ids.
  1968. * After a ring reset userspace should do a fresh start, so
  1969. * even LUN RESET message is no longer relevant.
  1970. * Therefore remove all TMRs from qfull queue
  1971. */
  1972. tcmu_remove_all_queued_tmr(udev);
  1973. run_qfull_queue(udev, false);
  1974. mutex_unlock(&udev->cmdr_lock);
  1975. }
  1976. enum {
  1977. Opt_dev_config, Opt_dev_size, Opt_hw_block_size, Opt_hw_max_sectors,
  1978. Opt_nl_reply_supported, Opt_max_data_area_mb, Opt_data_pages_per_blk,
  1979. Opt_cmd_ring_size_mb, Opt_err,
  1980. };
  1981. static match_table_t tokens = {
  1982. {Opt_dev_config, "dev_config=%s"},
  1983. {Opt_dev_size, "dev_size=%s"},
  1984. {Opt_hw_block_size, "hw_block_size=%d"},
  1985. {Opt_hw_max_sectors, "hw_max_sectors=%d"},
  1986. {Opt_nl_reply_supported, "nl_reply_supported=%d"},
  1987. {Opt_max_data_area_mb, "max_data_area_mb=%d"},
  1988. {Opt_data_pages_per_blk, "data_pages_per_blk=%d"},
  1989. {Opt_cmd_ring_size_mb, "cmd_ring_size_mb=%d"},
  1990. {Opt_err, NULL}
  1991. };
  1992. static int tcmu_set_dev_attrib(substring_t *arg, u32 *dev_attrib)
  1993. {
  1994. int val, ret;
  1995. ret = match_int(arg, &val);
  1996. if (ret < 0) {
  1997. pr_err("match_int() failed for dev attrib. Error %d.\n",
  1998. ret);
  1999. return ret;
  2000. }
  2001. if (val <= 0) {
  2002. pr_err("Invalid dev attrib value %d. Must be greater than zero.\n",
  2003. val);
  2004. return -EINVAL;
  2005. }
  2006. *dev_attrib = val;
  2007. return 0;
  2008. }
  2009. static int tcmu_set_max_blocks_param(struct tcmu_dev *udev, substring_t *arg)
  2010. {
  2011. int val, ret;
  2012. uint32_t pages_per_blk = udev->data_pages_per_blk;
  2013. ret = match_int(arg, &val);
  2014. if (ret < 0) {
  2015. pr_err("match_int() failed for max_data_area_mb=. Error %d.\n",
  2016. ret);
  2017. return ret;
  2018. }
  2019. if (val <= 0) {
  2020. pr_err("Invalid max_data_area %d.\n", val);
  2021. return -EINVAL;
  2022. }
  2023. if (val > TCMU_PAGES_TO_MBS(tcmu_global_max_pages)) {
  2024. pr_err("%d is too large. Adjusting max_data_area_mb to global limit of %u\n",
  2025. val, TCMU_PAGES_TO_MBS(tcmu_global_max_pages));
  2026. val = TCMU_PAGES_TO_MBS(tcmu_global_max_pages);
  2027. }
  2028. if (TCMU_MBS_TO_PAGES(val) < pages_per_blk) {
  2029. pr_err("Invalid max_data_area %d (%zu pages): smaller than data_pages_per_blk (%u pages).\n",
  2030. val, TCMU_MBS_TO_PAGES(val), pages_per_blk);
  2031. return -EINVAL;
  2032. }
  2033. mutex_lock(&udev->cmdr_lock);
  2034. if (udev->data_bitmap) {
  2035. pr_err("Cannot set max_data_area_mb after it has been enabled.\n");
  2036. ret = -EINVAL;
  2037. goto unlock;
  2038. }
  2039. udev->data_area_mb = val;
  2040. udev->max_blocks = TCMU_MBS_TO_PAGES(val) / pages_per_blk;
  2041. unlock:
  2042. mutex_unlock(&udev->cmdr_lock);
  2043. return ret;
  2044. }
  2045. static int tcmu_set_data_pages_per_blk(struct tcmu_dev *udev, substring_t *arg)
  2046. {
  2047. int val, ret;
  2048. ret = match_int(arg, &val);
  2049. if (ret < 0) {
  2050. pr_err("match_int() failed for data_pages_per_blk=. Error %d.\n",
  2051. ret);
  2052. return ret;
  2053. }
  2054. if (val > TCMU_MBS_TO_PAGES(udev->data_area_mb)) {
  2055. pr_err("Invalid data_pages_per_blk %d: greater than max_data_area_mb %d -> %zd pages).\n",
  2056. val, udev->data_area_mb,
  2057. TCMU_MBS_TO_PAGES(udev->data_area_mb));
  2058. return -EINVAL;
  2059. }
  2060. mutex_lock(&udev->cmdr_lock);
  2061. if (udev->data_bitmap) {
  2062. pr_err("Cannot set data_pages_per_blk after it has been enabled.\n");
  2063. ret = -EINVAL;
  2064. goto unlock;
  2065. }
  2066. udev->data_pages_per_blk = val;
  2067. udev->max_blocks = TCMU_MBS_TO_PAGES(udev->data_area_mb) / val;
  2068. unlock:
  2069. mutex_unlock(&udev->cmdr_lock);
  2070. return ret;
  2071. }
  2072. static int tcmu_set_cmd_ring_size(struct tcmu_dev *udev, substring_t *arg)
  2073. {
  2074. int val, ret;
  2075. ret = match_int(arg, &val);
  2076. if (ret < 0) {
  2077. pr_err("match_int() failed for cmd_ring_size_mb=. Error %d.\n",
  2078. ret);
  2079. return ret;
  2080. }
  2081. if (val <= 0) {
  2082. pr_err("Invalid cmd_ring_size_mb %d.\n", val);
  2083. return -EINVAL;
  2084. }
  2085. mutex_lock(&udev->cmdr_lock);
  2086. if (udev->data_bitmap) {
  2087. pr_err("Cannot set cmd_ring_size_mb after it has been enabled.\n");
  2088. ret = -EINVAL;
  2089. goto unlock;
  2090. }
  2091. udev->cmdr_size = (val << 20) - CMDR_OFF;
  2092. if (val > (MB_CMDR_SIZE_DEF >> 20)) {
  2093. pr_err("%d is too large. Adjusting cmd_ring_size_mb to global limit of %u\n",
  2094. val, (MB_CMDR_SIZE_DEF >> 20));
  2095. udev->cmdr_size = CMDR_SIZE_DEF;
  2096. }
  2097. unlock:
  2098. mutex_unlock(&udev->cmdr_lock);
  2099. return ret;
  2100. }
  2101. static ssize_t tcmu_set_configfs_dev_params(struct se_device *dev,
  2102. const char *page, ssize_t count)
  2103. {
  2104. struct tcmu_dev *udev = TCMU_DEV(dev);
  2105. char *orig, *ptr, *opts;
  2106. substring_t args[MAX_OPT_ARGS];
  2107. int ret = 0, token;
  2108. opts = kstrdup(page, GFP_KERNEL);
  2109. if (!opts)
  2110. return -ENOMEM;
  2111. orig = opts;
  2112. while ((ptr = strsep(&opts, ",\n")) != NULL) {
  2113. if (!*ptr)
  2114. continue;
  2115. token = match_token(ptr, tokens, args);
  2116. switch (token) {
  2117. case Opt_dev_config:
  2118. if (match_strlcpy(udev->dev_config, &args[0],
  2119. TCMU_CONFIG_LEN) == 0) {
  2120. ret = -EINVAL;
  2121. break;
  2122. }
  2123. pr_debug("TCMU: Referencing Path: %s\n", udev->dev_config);
  2124. break;
  2125. case Opt_dev_size:
  2126. ret = match_u64(&args[0], &udev->dev_size);
  2127. if (ret < 0)
  2128. pr_err("match_u64() failed for dev_size=. Error %d.\n",
  2129. ret);
  2130. break;
  2131. case Opt_hw_block_size:
  2132. ret = tcmu_set_dev_attrib(&args[0],
  2133. &(dev->dev_attrib.hw_block_size));
  2134. break;
  2135. case Opt_hw_max_sectors:
  2136. ret = tcmu_set_dev_attrib(&args[0],
  2137. &(dev->dev_attrib.hw_max_sectors));
  2138. break;
  2139. case Opt_nl_reply_supported:
  2140. ret = match_int(&args[0], &udev->nl_reply_supported);
  2141. if (ret < 0)
  2142. pr_err("match_int() failed for nl_reply_supported=. Error %d.\n",
  2143. ret);
  2144. break;
  2145. case Opt_max_data_area_mb:
  2146. ret = tcmu_set_max_blocks_param(udev, &args[0]);
  2147. break;
  2148. case Opt_data_pages_per_blk:
  2149. ret = tcmu_set_data_pages_per_blk(udev, &args[0]);
  2150. break;
  2151. case Opt_cmd_ring_size_mb:
  2152. ret = tcmu_set_cmd_ring_size(udev, &args[0]);
  2153. break;
  2154. default:
  2155. break;
  2156. }
  2157. if (ret)
  2158. break;
  2159. }
  2160. kfree(orig);
  2161. return (!ret) ? count : ret;
  2162. }
  2163. static ssize_t tcmu_show_configfs_dev_params(struct se_device *dev, char *b)
  2164. {
  2165. struct tcmu_dev *udev = TCMU_DEV(dev);
  2166. ssize_t bl = 0;
  2167. bl = sprintf(b + bl, "Config: %s ",
  2168. udev->dev_config[0] ? udev->dev_config : "NULL");
  2169. bl += sprintf(b + bl, "Size: %llu ", udev->dev_size);
  2170. bl += sprintf(b + bl, "MaxDataAreaMB: %u ", udev->data_area_mb);
  2171. bl += sprintf(b + bl, "DataPagesPerBlk: %u ", udev->data_pages_per_blk);
  2172. bl += sprintf(b + bl, "CmdRingSizeMB: %u\n",
  2173. (udev->cmdr_size + CMDR_OFF) >> 20);
  2174. return bl;
  2175. }
  2176. static sector_t tcmu_get_blocks(struct se_device *dev)
  2177. {
  2178. struct tcmu_dev *udev = TCMU_DEV(dev);
  2179. return div_u64(udev->dev_size - dev->dev_attrib.block_size,
  2180. dev->dev_attrib.block_size);
  2181. }
  2182. static sense_reason_t
  2183. tcmu_parse_cdb(struct se_cmd *cmd)
  2184. {
  2185. return passthrough_parse_cdb(cmd, tcmu_queue_cmd);
  2186. }
  2187. static ssize_t tcmu_cmd_time_out_show(struct config_item *item, char *page)
  2188. {
  2189. struct se_dev_attrib *da = container_of(to_config_group(item),
  2190. struct se_dev_attrib, da_group);
  2191. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2192. return snprintf(page, PAGE_SIZE, "%lu\n", udev->cmd_time_out / MSEC_PER_SEC);
  2193. }
  2194. static ssize_t tcmu_cmd_time_out_store(struct config_item *item, const char *page,
  2195. size_t count)
  2196. {
  2197. struct se_dev_attrib *da = container_of(to_config_group(item),
  2198. struct se_dev_attrib, da_group);
  2199. struct tcmu_dev *udev = container_of(da->da_dev,
  2200. struct tcmu_dev, se_dev);
  2201. u32 val;
  2202. int ret;
  2203. if (da->da_dev->export_count) {
  2204. pr_err("Unable to set tcmu cmd_time_out while exports exist\n");
  2205. return -EINVAL;
  2206. }
  2207. ret = kstrtou32(page, 0, &val);
  2208. if (ret < 0)
  2209. return ret;
  2210. udev->cmd_time_out = val * MSEC_PER_SEC;
  2211. return count;
  2212. }
  2213. CONFIGFS_ATTR(tcmu_, cmd_time_out);
  2214. static ssize_t tcmu_qfull_time_out_show(struct config_item *item, char *page)
  2215. {
  2216. struct se_dev_attrib *da = container_of(to_config_group(item),
  2217. struct se_dev_attrib, da_group);
  2218. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2219. return snprintf(page, PAGE_SIZE, "%ld\n", udev->qfull_time_out <= 0 ?
  2220. udev->qfull_time_out :
  2221. udev->qfull_time_out / MSEC_PER_SEC);
  2222. }
  2223. static ssize_t tcmu_qfull_time_out_store(struct config_item *item,
  2224. const char *page, size_t count)
  2225. {
  2226. struct se_dev_attrib *da = container_of(to_config_group(item),
  2227. struct se_dev_attrib, da_group);
  2228. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2229. s32 val;
  2230. int ret;
  2231. ret = kstrtos32(page, 0, &val);
  2232. if (ret < 0)
  2233. return ret;
  2234. if (val >= 0) {
  2235. udev->qfull_time_out = val * MSEC_PER_SEC;
  2236. } else if (val == -1) {
  2237. udev->qfull_time_out = val;
  2238. } else {
  2239. printk(KERN_ERR "Invalid qfull timeout value %d\n", val);
  2240. return -EINVAL;
  2241. }
  2242. return count;
  2243. }
  2244. CONFIGFS_ATTR(tcmu_, qfull_time_out);
  2245. static ssize_t tcmu_max_data_area_mb_show(struct config_item *item, char *page)
  2246. {
  2247. struct se_dev_attrib *da = container_of(to_config_group(item),
  2248. struct se_dev_attrib, da_group);
  2249. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2250. return snprintf(page, PAGE_SIZE, "%u\n", udev->data_area_mb);
  2251. }
  2252. CONFIGFS_ATTR_RO(tcmu_, max_data_area_mb);
  2253. static ssize_t tcmu_data_pages_per_blk_show(struct config_item *item,
  2254. char *page)
  2255. {
  2256. struct se_dev_attrib *da = container_of(to_config_group(item),
  2257. struct se_dev_attrib, da_group);
  2258. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2259. return snprintf(page, PAGE_SIZE, "%u\n", udev->data_pages_per_blk);
  2260. }
  2261. CONFIGFS_ATTR_RO(tcmu_, data_pages_per_blk);
  2262. static ssize_t tcmu_cmd_ring_size_mb_show(struct config_item *item, char *page)
  2263. {
  2264. struct se_dev_attrib *da = container_of(to_config_group(item),
  2265. struct se_dev_attrib, da_group);
  2266. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2267. return snprintf(page, PAGE_SIZE, "%u\n",
  2268. (udev->cmdr_size + CMDR_OFF) >> 20);
  2269. }
  2270. CONFIGFS_ATTR_RO(tcmu_, cmd_ring_size_mb);
  2271. static ssize_t tcmu_dev_config_show(struct config_item *item, char *page)
  2272. {
  2273. struct se_dev_attrib *da = container_of(to_config_group(item),
  2274. struct se_dev_attrib, da_group);
  2275. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2276. return snprintf(page, PAGE_SIZE, "%s\n", udev->dev_config);
  2277. }
  2278. static int tcmu_send_dev_config_event(struct tcmu_dev *udev,
  2279. const char *reconfig_data)
  2280. {
  2281. struct sk_buff *skb = NULL;
  2282. void *msg_header = NULL;
  2283. int ret = 0;
  2284. ret = tcmu_netlink_event_init(udev, TCMU_CMD_RECONFIG_DEVICE,
  2285. &skb, &msg_header);
  2286. if (ret < 0)
  2287. return ret;
  2288. ret = nla_put_string(skb, TCMU_ATTR_DEV_CFG, reconfig_data);
  2289. if (ret < 0) {
  2290. nlmsg_free(skb);
  2291. return ret;
  2292. }
  2293. return tcmu_netlink_event_send(udev, TCMU_CMD_RECONFIG_DEVICE,
  2294. skb, msg_header);
  2295. }
  2296. static ssize_t tcmu_dev_config_store(struct config_item *item, const char *page,
  2297. size_t count)
  2298. {
  2299. struct se_dev_attrib *da = container_of(to_config_group(item),
  2300. struct se_dev_attrib, da_group);
  2301. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2302. int ret, len;
  2303. len = strlen(page);
  2304. if (!len || len > TCMU_CONFIG_LEN - 1)
  2305. return -EINVAL;
  2306. /* Check if device has been configured before */
  2307. if (target_dev_configured(&udev->se_dev)) {
  2308. ret = tcmu_send_dev_config_event(udev, page);
  2309. if (ret) {
  2310. pr_err("Unable to reconfigure device\n");
  2311. return ret;
  2312. }
  2313. strscpy(udev->dev_config, page, TCMU_CONFIG_LEN);
  2314. ret = tcmu_update_uio_info(udev);
  2315. if (ret)
  2316. return ret;
  2317. return count;
  2318. }
  2319. strscpy(udev->dev_config, page, TCMU_CONFIG_LEN);
  2320. return count;
  2321. }
  2322. CONFIGFS_ATTR(tcmu_, dev_config);
  2323. static ssize_t tcmu_dev_size_show(struct config_item *item, char *page)
  2324. {
  2325. struct se_dev_attrib *da = container_of(to_config_group(item),
  2326. struct se_dev_attrib, da_group);
  2327. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2328. return snprintf(page, PAGE_SIZE, "%llu\n", udev->dev_size);
  2329. }
  2330. static int tcmu_send_dev_size_event(struct tcmu_dev *udev, u64 size)
  2331. {
  2332. struct sk_buff *skb = NULL;
  2333. void *msg_header = NULL;
  2334. int ret = 0;
  2335. ret = tcmu_netlink_event_init(udev, TCMU_CMD_RECONFIG_DEVICE,
  2336. &skb, &msg_header);
  2337. if (ret < 0)
  2338. return ret;
  2339. ret = nla_put_u64_64bit(skb, TCMU_ATTR_DEV_SIZE,
  2340. size, TCMU_ATTR_PAD);
  2341. if (ret < 0) {
  2342. nlmsg_free(skb);
  2343. return ret;
  2344. }
  2345. return tcmu_netlink_event_send(udev, TCMU_CMD_RECONFIG_DEVICE,
  2346. skb, msg_header);
  2347. }
  2348. static ssize_t tcmu_dev_size_store(struct config_item *item, const char *page,
  2349. size_t count)
  2350. {
  2351. struct se_dev_attrib *da = container_of(to_config_group(item),
  2352. struct se_dev_attrib, da_group);
  2353. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2354. u64 val;
  2355. int ret;
  2356. ret = kstrtou64(page, 0, &val);
  2357. if (ret < 0)
  2358. return ret;
  2359. /* Check if device has been configured before */
  2360. if (target_dev_configured(&udev->se_dev)) {
  2361. ret = tcmu_send_dev_size_event(udev, val);
  2362. if (ret) {
  2363. pr_err("Unable to reconfigure device\n");
  2364. return ret;
  2365. }
  2366. }
  2367. udev->dev_size = val;
  2368. return count;
  2369. }
  2370. CONFIGFS_ATTR(tcmu_, dev_size);
  2371. static ssize_t tcmu_nl_reply_supported_show(struct config_item *item,
  2372. char *page)
  2373. {
  2374. struct se_dev_attrib *da = container_of(to_config_group(item),
  2375. struct se_dev_attrib, da_group);
  2376. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2377. return snprintf(page, PAGE_SIZE, "%d\n", udev->nl_reply_supported);
  2378. }
  2379. static ssize_t tcmu_nl_reply_supported_store(struct config_item *item,
  2380. const char *page, size_t count)
  2381. {
  2382. struct se_dev_attrib *da = container_of(to_config_group(item),
  2383. struct se_dev_attrib, da_group);
  2384. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2385. s8 val;
  2386. int ret;
  2387. ret = kstrtos8(page, 0, &val);
  2388. if (ret < 0)
  2389. return ret;
  2390. udev->nl_reply_supported = val;
  2391. return count;
  2392. }
  2393. CONFIGFS_ATTR(tcmu_, nl_reply_supported);
  2394. static ssize_t tcmu_emulate_write_cache_show(struct config_item *item,
  2395. char *page)
  2396. {
  2397. struct se_dev_attrib *da = container_of(to_config_group(item),
  2398. struct se_dev_attrib, da_group);
  2399. return snprintf(page, PAGE_SIZE, "%i\n", da->emulate_write_cache);
  2400. }
  2401. static int tcmu_send_emulate_write_cache(struct tcmu_dev *udev, u8 val)
  2402. {
  2403. struct sk_buff *skb = NULL;
  2404. void *msg_header = NULL;
  2405. int ret = 0;
  2406. ret = tcmu_netlink_event_init(udev, TCMU_CMD_RECONFIG_DEVICE,
  2407. &skb, &msg_header);
  2408. if (ret < 0)
  2409. return ret;
  2410. ret = nla_put_u8(skb, TCMU_ATTR_WRITECACHE, val);
  2411. if (ret < 0) {
  2412. nlmsg_free(skb);
  2413. return ret;
  2414. }
  2415. return tcmu_netlink_event_send(udev, TCMU_CMD_RECONFIG_DEVICE,
  2416. skb, msg_header);
  2417. }
  2418. static ssize_t tcmu_emulate_write_cache_store(struct config_item *item,
  2419. const char *page, size_t count)
  2420. {
  2421. struct se_dev_attrib *da = container_of(to_config_group(item),
  2422. struct se_dev_attrib, da_group);
  2423. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2424. u8 val;
  2425. int ret;
  2426. ret = kstrtou8(page, 0, &val);
  2427. if (ret < 0)
  2428. return ret;
  2429. /* Check if device has been configured before */
  2430. if (target_dev_configured(&udev->se_dev)) {
  2431. ret = tcmu_send_emulate_write_cache(udev, val);
  2432. if (ret) {
  2433. pr_err("Unable to reconfigure device\n");
  2434. return ret;
  2435. }
  2436. }
  2437. da->emulate_write_cache = val;
  2438. return count;
  2439. }
  2440. CONFIGFS_ATTR(tcmu_, emulate_write_cache);
  2441. static ssize_t tcmu_tmr_notification_show(struct config_item *item, char *page)
  2442. {
  2443. struct se_dev_attrib *da = container_of(to_config_group(item),
  2444. struct se_dev_attrib, da_group);
  2445. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2446. return snprintf(page, PAGE_SIZE, "%i\n",
  2447. test_bit(TCMU_DEV_BIT_TMR_NOTIFY, &udev->flags));
  2448. }
  2449. static ssize_t tcmu_tmr_notification_store(struct config_item *item,
  2450. const char *page, size_t count)
  2451. {
  2452. struct se_dev_attrib *da = container_of(to_config_group(item),
  2453. struct se_dev_attrib, da_group);
  2454. struct tcmu_dev *udev = TCMU_DEV(da->da_dev);
  2455. u8 val;
  2456. int ret;
  2457. ret = kstrtou8(page, 0, &val);
  2458. if (ret < 0)
  2459. return ret;
  2460. if (val > 1)
  2461. return -EINVAL;
  2462. if (val)
  2463. set_bit(TCMU_DEV_BIT_TMR_NOTIFY, &udev->flags);
  2464. else
  2465. clear_bit(TCMU_DEV_BIT_TMR_NOTIFY, &udev->flags);
  2466. return count;
  2467. }
  2468. CONFIGFS_ATTR(tcmu_, tmr_notification);
  2469. static ssize_t tcmu_block_dev_show(struct config_item *item, char *page)
  2470. {
  2471. struct se_device *se_dev = container_of(to_config_group(item),
  2472. struct se_device,
  2473. dev_action_group);
  2474. struct tcmu_dev *udev = TCMU_DEV(se_dev);
  2475. if (test_bit(TCMU_DEV_BIT_BLOCKED, &udev->flags))
  2476. return snprintf(page, PAGE_SIZE, "%s\n", "blocked");
  2477. else
  2478. return snprintf(page, PAGE_SIZE, "%s\n", "unblocked");
  2479. }
  2480. static ssize_t tcmu_block_dev_store(struct config_item *item, const char *page,
  2481. size_t count)
  2482. {
  2483. struct se_device *se_dev = container_of(to_config_group(item),
  2484. struct se_device,
  2485. dev_action_group);
  2486. struct tcmu_dev *udev = TCMU_DEV(se_dev);
  2487. u8 val;
  2488. int ret;
  2489. if (!target_dev_configured(&udev->se_dev)) {
  2490. pr_err("Device is not configured.\n");
  2491. return -EINVAL;
  2492. }
  2493. ret = kstrtou8(page, 0, &val);
  2494. if (ret < 0)
  2495. return ret;
  2496. if (val > 1) {
  2497. pr_err("Invalid block value %d\n", val);
  2498. return -EINVAL;
  2499. }
  2500. if (!val)
  2501. tcmu_unblock_dev(udev);
  2502. else
  2503. tcmu_block_dev(udev);
  2504. return count;
  2505. }
  2506. CONFIGFS_ATTR(tcmu_, block_dev);
  2507. static ssize_t tcmu_reset_ring_store(struct config_item *item, const char *page,
  2508. size_t count)
  2509. {
  2510. struct se_device *se_dev = container_of(to_config_group(item),
  2511. struct se_device,
  2512. dev_action_group);
  2513. struct tcmu_dev *udev = TCMU_DEV(se_dev);
  2514. u8 val;
  2515. int ret;
  2516. if (!target_dev_configured(&udev->se_dev)) {
  2517. pr_err("Device is not configured.\n");
  2518. return -EINVAL;
  2519. }
  2520. ret = kstrtou8(page, 0, &val);
  2521. if (ret < 0)
  2522. return ret;
  2523. if (val != 1 && val != 2) {
  2524. pr_err("Invalid reset ring value %d\n", val);
  2525. return -EINVAL;
  2526. }
  2527. tcmu_reset_ring(udev, val);
  2528. return count;
  2529. }
  2530. CONFIGFS_ATTR_WO(tcmu_, reset_ring);
  2531. static ssize_t tcmu_free_kept_buf_store(struct config_item *item, const char *page,
  2532. size_t count)
  2533. {
  2534. struct se_device *se_dev = container_of(to_config_group(item),
  2535. struct se_device,
  2536. dev_action_group);
  2537. struct tcmu_dev *udev = TCMU_DEV(se_dev);
  2538. struct tcmu_cmd *cmd;
  2539. u16 cmd_id;
  2540. int ret;
  2541. if (!target_dev_configured(&udev->se_dev)) {
  2542. pr_err("Device is not configured.\n");
  2543. return -EINVAL;
  2544. }
  2545. ret = kstrtou16(page, 0, &cmd_id);
  2546. if (ret < 0)
  2547. return ret;
  2548. mutex_lock(&udev->cmdr_lock);
  2549. {
  2550. XA_STATE(xas, &udev->commands, cmd_id);
  2551. xas_lock(&xas);
  2552. cmd = xas_load(&xas);
  2553. if (!cmd) {
  2554. pr_err("free_kept_buf: cmd_id %d not found\n", cmd_id);
  2555. count = -EINVAL;
  2556. xas_unlock(&xas);
  2557. goto out_unlock;
  2558. }
  2559. if (!test_bit(TCMU_CMD_BIT_KEEP_BUF, &cmd->flags)) {
  2560. pr_err("free_kept_buf: cmd_id %d was not completed with KEEP_BUF\n",
  2561. cmd_id);
  2562. count = -EINVAL;
  2563. xas_unlock(&xas);
  2564. goto out_unlock;
  2565. }
  2566. xas_store(&xas, NULL);
  2567. xas_unlock(&xas);
  2568. }
  2569. tcmu_cmd_free_data(cmd, cmd->dbi_cnt);
  2570. tcmu_free_cmd(cmd);
  2571. /*
  2572. * We only freed data space, not ring space. Therefore we dont call
  2573. * run_tmr_queue, but call run_qfull_queue if tmr_list is empty.
  2574. */
  2575. if (list_empty(&udev->tmr_queue))
  2576. run_qfull_queue(udev, false);
  2577. out_unlock:
  2578. mutex_unlock(&udev->cmdr_lock);
  2579. return count;
  2580. }
  2581. CONFIGFS_ATTR_WO(tcmu_, free_kept_buf);
  2582. static struct configfs_attribute *tcmu_attrib_attrs[] = {
  2583. &tcmu_attr_cmd_time_out,
  2584. &tcmu_attr_qfull_time_out,
  2585. &tcmu_attr_max_data_area_mb,
  2586. &tcmu_attr_data_pages_per_blk,
  2587. &tcmu_attr_cmd_ring_size_mb,
  2588. &tcmu_attr_dev_config,
  2589. &tcmu_attr_dev_size,
  2590. &tcmu_attr_emulate_write_cache,
  2591. &tcmu_attr_tmr_notification,
  2592. &tcmu_attr_nl_reply_supported,
  2593. NULL,
  2594. };
  2595. static struct configfs_attribute **tcmu_attrs;
  2596. static struct configfs_attribute *tcmu_action_attrs[] = {
  2597. &tcmu_attr_block_dev,
  2598. &tcmu_attr_reset_ring,
  2599. &tcmu_attr_free_kept_buf,
  2600. NULL,
  2601. };
  2602. static struct target_backend_ops tcmu_ops = {
  2603. .name = "user",
  2604. .owner = THIS_MODULE,
  2605. .transport_flags_default = TRANSPORT_FLAG_PASSTHROUGH,
  2606. .transport_flags_changeable = TRANSPORT_FLAG_PASSTHROUGH_PGR |
  2607. TRANSPORT_FLAG_PASSTHROUGH_ALUA,
  2608. .attach_hba = tcmu_attach_hba,
  2609. .detach_hba = tcmu_detach_hba,
  2610. .alloc_device = tcmu_alloc_device,
  2611. .configure_device = tcmu_configure_device,
  2612. .destroy_device = tcmu_destroy_device,
  2613. .free_device = tcmu_free_device,
  2614. .unplug_device = tcmu_unplug_device,
  2615. .plug_device = tcmu_plug_device,
  2616. .parse_cdb = tcmu_parse_cdb,
  2617. .tmr_notify = tcmu_tmr_notify,
  2618. .set_configfs_dev_params = tcmu_set_configfs_dev_params,
  2619. .show_configfs_dev_params = tcmu_show_configfs_dev_params,
  2620. .get_device_type = sbc_get_device_type,
  2621. .get_blocks = tcmu_get_blocks,
  2622. .tb_dev_action_attrs = tcmu_action_attrs,
  2623. };
  2624. static void find_free_blocks(void)
  2625. {
  2626. struct tcmu_dev *udev;
  2627. loff_t off;
  2628. u32 pages_freed, total_pages_freed = 0;
  2629. u32 start, end, block, total_blocks_freed = 0;
  2630. if (atomic_read(&global_page_count) <= tcmu_global_max_pages)
  2631. return;
  2632. mutex_lock(&root_udev_mutex);
  2633. list_for_each_entry(udev, &root_udev, node) {
  2634. mutex_lock(&udev->cmdr_lock);
  2635. if (!target_dev_configured(&udev->se_dev)) {
  2636. mutex_unlock(&udev->cmdr_lock);
  2637. continue;
  2638. }
  2639. /* Try to complete the finished commands first */
  2640. if (tcmu_handle_completions(udev))
  2641. run_qfull_queue(udev, false);
  2642. /* Skip the udevs in idle */
  2643. if (!udev->dbi_thresh) {
  2644. mutex_unlock(&udev->cmdr_lock);
  2645. continue;
  2646. }
  2647. end = udev->dbi_max + 1;
  2648. block = find_last_bit(udev->data_bitmap, end);
  2649. if (block == udev->dbi_max) {
  2650. /*
  2651. * The last bit is dbi_max, so it is not possible
  2652. * reclaim any blocks.
  2653. */
  2654. mutex_unlock(&udev->cmdr_lock);
  2655. continue;
  2656. } else if (block == end) {
  2657. /* The current udev will goto idle state */
  2658. udev->dbi_thresh = start = 0;
  2659. udev->dbi_max = 0;
  2660. } else {
  2661. udev->dbi_thresh = start = block + 1;
  2662. udev->dbi_max = block;
  2663. }
  2664. /*
  2665. * Release the block pages.
  2666. *
  2667. * Also note that since tcmu_vma_fault() gets an extra page
  2668. * refcount, tcmu_blocks_release() won't free pages if pages
  2669. * are mapped. This means it is safe to call
  2670. * tcmu_blocks_release() before unmap_mapping_range() which
  2671. * drops the refcount of any pages it unmaps and thus releases
  2672. * them.
  2673. */
  2674. pages_freed = tcmu_blocks_release(udev, start, end - 1);
  2675. /* Here will truncate the data area from off */
  2676. off = udev->data_off + (loff_t)start * udev->data_blk_size;
  2677. unmap_mapping_range(udev->inode->i_mapping, off, 0, 1);
  2678. mutex_unlock(&udev->cmdr_lock);
  2679. total_pages_freed += pages_freed;
  2680. total_blocks_freed += end - start;
  2681. pr_debug("Freed %u pages (total %u) from %u blocks (total %u) from %s.\n",
  2682. pages_freed, total_pages_freed, end - start,
  2683. total_blocks_freed, udev->name);
  2684. }
  2685. mutex_unlock(&root_udev_mutex);
  2686. if (atomic_read(&global_page_count) > tcmu_global_max_pages)
  2687. schedule_delayed_work(&tcmu_unmap_work, msecs_to_jiffies(5000));
  2688. }
  2689. static void check_timedout_devices(void)
  2690. {
  2691. struct tcmu_dev *udev, *tmp_dev;
  2692. struct tcmu_cmd *cmd, *tmp_cmd;
  2693. LIST_HEAD(devs);
  2694. spin_lock_bh(&timed_out_udevs_lock);
  2695. list_splice_init(&timed_out_udevs, &devs);
  2696. list_for_each_entry_safe(udev, tmp_dev, &devs, timedout_entry) {
  2697. list_del_init(&udev->timedout_entry);
  2698. spin_unlock_bh(&timed_out_udevs_lock);
  2699. mutex_lock(&udev->cmdr_lock);
  2700. /*
  2701. * If cmd_time_out is disabled but qfull is set deadline
  2702. * will only reflect the qfull timeout. Ignore it.
  2703. */
  2704. if (udev->cmd_time_out) {
  2705. list_for_each_entry_safe(cmd, tmp_cmd,
  2706. &udev->inflight_queue,
  2707. queue_entry) {
  2708. tcmu_check_expired_ring_cmd(cmd);
  2709. }
  2710. tcmu_set_next_deadline(&udev->inflight_queue,
  2711. &udev->cmd_timer);
  2712. }
  2713. list_for_each_entry_safe(cmd, tmp_cmd, &udev->qfull_queue,
  2714. queue_entry) {
  2715. tcmu_check_expired_queue_cmd(cmd);
  2716. }
  2717. tcmu_set_next_deadline(&udev->qfull_queue, &udev->qfull_timer);
  2718. mutex_unlock(&udev->cmdr_lock);
  2719. spin_lock_bh(&timed_out_udevs_lock);
  2720. }
  2721. spin_unlock_bh(&timed_out_udevs_lock);
  2722. }
  2723. static void tcmu_unmap_work_fn(struct work_struct *work)
  2724. {
  2725. check_timedout_devices();
  2726. find_free_blocks();
  2727. }
  2728. static int __init tcmu_module_init(void)
  2729. {
  2730. int ret, i, k, len = 0;
  2731. BUILD_BUG_ON((sizeof(struct tcmu_cmd_entry) % TCMU_OP_ALIGN_SIZE) != 0);
  2732. INIT_DELAYED_WORK(&tcmu_unmap_work, tcmu_unmap_work_fn);
  2733. tcmu_cmd_cache = kmem_cache_create("tcmu_cmd_cache",
  2734. sizeof(struct tcmu_cmd),
  2735. __alignof__(struct tcmu_cmd),
  2736. 0, NULL);
  2737. if (!tcmu_cmd_cache)
  2738. return -ENOMEM;
  2739. tcmu_root_device = root_device_register("tcm_user");
  2740. if (IS_ERR(tcmu_root_device)) {
  2741. ret = PTR_ERR(tcmu_root_device);
  2742. goto out_free_cache;
  2743. }
  2744. ret = genl_register_family(&tcmu_genl_family);
  2745. if (ret < 0) {
  2746. goto out_unreg_device;
  2747. }
  2748. for (i = 0; passthrough_attrib_attrs[i] != NULL; i++)
  2749. len += sizeof(struct configfs_attribute *);
  2750. for (i = 0; passthrough_pr_attrib_attrs[i] != NULL; i++)
  2751. len += sizeof(struct configfs_attribute *);
  2752. for (i = 0; tcmu_attrib_attrs[i] != NULL; i++)
  2753. len += sizeof(struct configfs_attribute *);
  2754. len += sizeof(struct configfs_attribute *);
  2755. tcmu_attrs = kzalloc(len, GFP_KERNEL);
  2756. if (!tcmu_attrs) {
  2757. ret = -ENOMEM;
  2758. goto out_unreg_genl;
  2759. }
  2760. for (i = 0; passthrough_attrib_attrs[i] != NULL; i++)
  2761. tcmu_attrs[i] = passthrough_attrib_attrs[i];
  2762. for (k = 0; passthrough_pr_attrib_attrs[k] != NULL; k++)
  2763. tcmu_attrs[i++] = passthrough_pr_attrib_attrs[k];
  2764. for (k = 0; tcmu_attrib_attrs[k] != NULL; k++)
  2765. tcmu_attrs[i++] = tcmu_attrib_attrs[k];
  2766. tcmu_ops.tb_dev_attrib_attrs = tcmu_attrs;
  2767. ret = transport_backend_register(&tcmu_ops);
  2768. if (ret)
  2769. goto out_attrs;
  2770. return 0;
  2771. out_attrs:
  2772. kfree(tcmu_attrs);
  2773. out_unreg_genl:
  2774. genl_unregister_family(&tcmu_genl_family);
  2775. out_unreg_device:
  2776. root_device_unregister(tcmu_root_device);
  2777. out_free_cache:
  2778. kmem_cache_destroy(tcmu_cmd_cache);
  2779. return ret;
  2780. }
  2781. static void __exit tcmu_module_exit(void)
  2782. {
  2783. cancel_delayed_work_sync(&tcmu_unmap_work);
  2784. target_backend_unregister(&tcmu_ops);
  2785. kfree(tcmu_attrs);
  2786. genl_unregister_family(&tcmu_genl_family);
  2787. root_device_unregister(tcmu_root_device);
  2788. kmem_cache_destroy(tcmu_cmd_cache);
  2789. }
  2790. MODULE_DESCRIPTION("TCM USER subsystem plugin");
  2791. MODULE_AUTHOR("Shaohua Li <shli@kernel.org>");
  2792. MODULE_AUTHOR("Andy Grover <agrover@redhat.com>");
  2793. MODULE_LICENSE("GPL");
  2794. module_init(tcmu_module_init);
  2795. module_exit(tcmu_module_exit);