2 * Copyright (c) 2014 VMware, Inc.
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at:
8 * http://www.apache.org/licenses/LICENSE-2.0
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
18 * XXX: OVS_USE_NL_INTERFACE is being used to keep the legacy DPIF interface
19 * alive while we transition over to the netlink based interface.
20 * OVS_USE_NL_INTERFACE = 0 => legacy interface to use with dpif-windows.c
21 * OVS_USE_NL_INTERFACE = 1 => netlink interface to use with ported dpif-linux.c
23 #if defined OVS_USE_NL_INTERFACE && OVS_USE_NL_INTERFACE == 1
40 #define OVS_DBG_MOD OVS_DBG_DATAPATH
43 #define NETLINK_FAMILY_NAME_LEN 48
47 * Netlink messages are grouped by family (aka type), and each family supports
48 * a set of commands, and can be passed both from kernel -> userspace or
49 * vice-versa. To call into the kernel, userspace uses a device operation which
50 * is outside of a netlink message.
52 * Each command results in the invocation of a handler function to implement the
53 * request functionality.
55 * Expectedly, only certain combinations of (device operation, netlink family,
58 * Here, we implement the basic infrastructure to perform validation on the
59 * incoming message, version checking, and also to invoke the corresponding
60 * handler to do the heavy-lifting.
64 * Handler for a given netlink command. Not all the parameters are used by all
67 typedef NTSTATUS(NetlinkCmdHandler)(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
70 typedef struct _NETLINK_CMD {
72 NetlinkCmdHandler *handler;
73 UINT32 supportedDevOp; /* Supported device operations. */
74 BOOLEAN validateDpIndex; /* Does command require a valid DP argument. */
75 } NETLINK_CMD, *PNETLINK_CMD;
77 /* A netlink family is a group of commands. */
78 typedef struct _NETLINK_FAMILY {
84 NETLINK_CMD *cmds; /* Array of netlink commands and handlers. */
86 } NETLINK_FAMILY, *PNETLINK_FAMILY;
89 * Device operations to tag netlink commands with. This is a bitmask since it is
90 * possible that a particular command can be invoked via different device
93 #define OVS_READ_DEV_OP (1 << 0)
94 #define OVS_WRITE_DEV_OP (1 << 1)
95 #define OVS_TRANSACTION_DEV_OP (1 << 2)
96 #define OVS_READ_EVENT_DEV_OP (1 << 3)
98 /* Handlers for the various netlink commands. */
99 static NetlinkCmdHandler OvsGetPidCmdHandler,
101 OvsPendEventCmdHandler,
102 OvsSubscribeEventCmdHandler,
104 OvsReadEventCmdHandler,
105 OvsGetVportCmdHandler;
107 static NTSTATUS HandleGetDpTransaction(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
109 static NTSTATUS HandleGetDpDump(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
111 static NTSTATUS HandleDpTransaction(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
115 * The various netlink families, along with the supported commands. Most of
116 * these families and commands are part of the openvswitch specification for a
117 * netlink datapath. In addition, each platform can implement a few families
118 * and commands as extensions.
121 /* Netlink control family: this is a Windows specific family. */
122 NETLINK_CMD nlControlFamilyCmdOps[] = {
123 { .cmd = OVS_CTRL_CMD_WIN_GET_PID,
124 .handler = OvsGetPidCmdHandler,
125 .supportedDevOp = OVS_TRANSACTION_DEV_OP,
126 .validateDpIndex = FALSE,
128 { .cmd = OVS_CTRL_CMD_WIN_PEND_REQ,
129 .handler = OvsPendEventCmdHandler,
130 .supportedDevOp = OVS_WRITE_DEV_OP,
131 .validateDpIndex = TRUE,
133 { .cmd = OVS_CTRL_CMD_MC_SUBSCRIBE_REQ,
134 .handler = OvsSubscribeEventCmdHandler,
135 .supportedDevOp = OVS_WRITE_DEV_OP,
136 .validateDpIndex = TRUE,
138 { .cmd = OVS_CTRL_CMD_EVENT_NOTIFY,
139 .handler = OvsReadEventCmdHandler,
140 .supportedDevOp = OVS_READ_EVENT_DEV_OP,
141 .validateDpIndex = FALSE,
145 NETLINK_FAMILY nlControlFamilyOps = {
146 .name = OVS_WIN_CONTROL_FAMILY,
147 .id = OVS_WIN_NL_CTRL_FAMILY_ID,
148 .version = OVS_WIN_CONTROL_VERSION,
149 .maxAttr = OVS_WIN_CONTROL_ATTR_MAX,
150 .cmds = nlControlFamilyCmdOps,
151 .opsCount = ARRAY_SIZE(nlControlFamilyCmdOps)
154 /* Netlink datapath family. */
155 NETLINK_CMD nlDatapathFamilyCmdOps[] = {
156 { .cmd = OVS_DP_CMD_GET,
157 .handler = OvsGetDpCmdHandler,
158 .supportedDevOp = OVS_WRITE_DEV_OP | OVS_READ_DEV_OP |
159 OVS_TRANSACTION_DEV_OP,
160 .validateDpIndex = FALSE
162 { .cmd = OVS_DP_CMD_SET,
163 .handler = OvsSetDpCmdHandler,
164 .supportedDevOp = OVS_WRITE_DEV_OP | OVS_READ_DEV_OP |
165 OVS_TRANSACTION_DEV_OP,
166 .validateDpIndex = TRUE
170 NETLINK_FAMILY nlDatapathFamilyOps = {
171 .name = OVS_DATAPATH_FAMILY,
172 .id = OVS_WIN_NL_DATAPATH_FAMILY_ID,
173 .version = OVS_DATAPATH_VERSION,
174 .maxAttr = OVS_DP_ATTR_MAX,
175 .cmds = nlDatapathFamilyCmdOps,
176 .opsCount = ARRAY_SIZE(nlDatapathFamilyCmdOps)
179 /* Netlink packet family. */
180 /* XXX: Add commands here. */
181 NETLINK_FAMILY nlPacketFamilyOps = {
182 .name = OVS_PACKET_FAMILY,
183 .id = OVS_WIN_NL_PACKET_FAMILY_ID,
184 .version = OVS_PACKET_VERSION,
185 .maxAttr = OVS_PACKET_ATTR_MAX,
186 .cmds = NULL, /* XXX: placeholder. */
190 /* Netlink vport family. */
191 NETLINK_CMD nlVportFamilyCmdOps[] = {
192 { .cmd = OVS_VPORT_CMD_GET,
193 .handler = OvsGetVportCmdHandler,
194 .supportedDevOp = OVS_WRITE_DEV_OP | OVS_READ_DEV_OP |
195 OVS_TRANSACTION_DEV_OP,
196 .validateDpIndex = TRUE
200 NETLINK_FAMILY nlVportFamilyOps = {
201 .name = OVS_VPORT_FAMILY,
202 .id = OVS_WIN_NL_VPORT_FAMILY_ID,
203 .version = OVS_VPORT_VERSION,
204 .maxAttr = OVS_VPORT_ATTR_MAX,
205 .cmds = nlVportFamilyCmdOps,
206 .opsCount = ARRAY_SIZE(nlVportFamilyCmdOps)
209 /* Netlink flow family. */
/*
 * Command table for the flow family. Both visible entries are accepted only
 * through the transaction device operation and dispatch to the same handler,
 * OvsFlowNlNewCmdHandler.
 *
 * NOTE(review): OVS_FLOW_CMD_SET skips the datapath-index check
 * (validateDpIndex = FALSE) while OVS_FLOW_CMD_NEW requires it. Confirm that
 * this asymmetry is intended.
 */
211 NETLINK_CMD nlFlowFamilyCmdOps[] = {
212 { .cmd = OVS_FLOW_CMD_NEW,
213 .handler = OvsFlowNlNewCmdHandler,
214 .supportedDevOp = OVS_TRANSACTION_DEV_OP,
215 .validateDpIndex = TRUE
217 { .cmd = OVS_FLOW_CMD_SET,
218 .handler = OvsFlowNlNewCmdHandler,
219 .supportedDevOp = OVS_TRANSACTION_DEV_OP,
220 .validateDpIndex = FALSE
224 NETLINK_FAMILY nlFLowFamilyOps = {
225 .name = OVS_FLOW_FAMILY,
226 .id = OVS_WIN_NL_FLOW_FAMILY_ID,
227 .version = OVS_FLOW_VERSION,
228 .maxAttr = OVS_FLOW_ATTR_MAX,
229 .cmds = nlFlowFamilyCmdOps,
230 .opsCount = ARRAY_SIZE(nlFlowFamilyCmdOps)
233 static NTSTATUS MapIrpOutputBuffer(PIRP irp,
235 UINT32 requiredLength,
237 static NTSTATUS ValidateNetlinkCmd(UINT32 devOp,
238 POVS_OPEN_INSTANCE instance,
240 NETLINK_FAMILY *nlFamilyOps);
241 static NTSTATUS InvokeNetlinkCmdHandler(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
242 NETLINK_FAMILY *nlFamilyOps,
244 static NTSTATUS OvsSetupDumpStart(POVS_USER_PARAMS_CONTEXT usrParamsCtx);
247 /* Handles to the device object for communication with userspace. */
248 NDIS_HANDLE gOvsDeviceHandle;
249 PDEVICE_OBJECT gOvsDeviceObject;
251 _Dispatch_type_(IRP_MJ_CREATE)
252 _Dispatch_type_(IRP_MJ_CLOSE)
253 DRIVER_DISPATCH OvsOpenCloseDevice;
255 _Dispatch_type_(IRP_MJ_CLEANUP)
256 DRIVER_DISPATCH OvsCleanupDevice;
258 _Dispatch_type_(IRP_MJ_DEVICE_CONTROL)
259 DRIVER_DISPATCH OvsDeviceControl;
262 #pragma alloc_text(INIT, OvsCreateDeviceObject)
263 #pragma alloc_text(PAGE, OvsOpenCloseDevice)
264 #pragma alloc_text(PAGE, OvsCleanupDevice)
265 #pragma alloc_text(PAGE, OvsDeviceControl)
266 #endif // ALLOC_PRAGMA
269 * We might hit this limit easily since userspace opens a netlink descriptor for
270 * each thread, and at least one descriptor per vport. Revisit this later.
272 #define OVS_MAX_OPEN_INSTANCES 512
273 #define OVS_SYSTEM_DP_NAME "ovs-system"
275 POVS_OPEN_INSTANCE ovsOpenInstanceArray[OVS_MAX_OPEN_INSTANCES];
276 UINT32 ovsNumberOfOpenInstances;
277 extern POVS_SWITCH_CONTEXT gOvsSwitchContext;
279 NDIS_SPIN_LOCK ovsCtrlLockObj;
280 PNDIS_SPIN_LOCK gOvsCtrlLock;
286 gOvsCtrlLock = &ovsCtrlLockObj;
287 NdisAllocateSpinLock(gOvsCtrlLock);
295 OvsCleanupEventQueue();
297 NdisFreeSpinLock(gOvsCtrlLock);
306 NdisAcquireSpinLock(gOvsCtrlLock);
312 NdisReleaseSpinLock(gOvsCtrlLock);
317 * --------------------------------------------------------------------------
318 * Creates the communication device between user and kernel, and also
319 * initializes the associated data structures.
320 * --------------------------------------------------------------------------
323 OvsCreateDeviceObject(NDIS_HANDLE ovsExtDriverHandle)
/*
 * Builds a dispatch table and device attributes, then registers the control
 * device with NDIS through NdisRegisterDeviceEx(). The device name, symbolic
 * name and per-device extension size (OVS_DEVICE_EXTENSION) are supplied via
 * 'deviceAttributes'.
 */
325 NDIS_STATUS status = NDIS_STATUS_SUCCESS;
326 UNICODE_STRING deviceName;
327 UNICODE_STRING symbolicDeviceName;
328 PDRIVER_DISPATCH dispatchTable[IRP_MJ_MAXIMUM_FUNCTION+1];
329 NDIS_DEVICE_OBJECT_ATTRIBUTES deviceAttributes;
330 OVS_LOG_TRACE("ovsExtDriverHandle: %p", ovsExtDriverHandle);
/*
 * Start from an all-NULL table; only create, close, cleanup and
 * device-control are assigned a handler below.
 */
332 RtlZeroMemory(dispatchTable,
333 (IRP_MJ_MAXIMUM_FUNCTION + 1) * sizeof (PDRIVER_DISPATCH));
334 dispatchTable[IRP_MJ_CREATE] = OvsOpenCloseDevice;
335 dispatchTable[IRP_MJ_CLOSE] = OvsOpenCloseDevice;
336 dispatchTable[IRP_MJ_CLEANUP] = OvsCleanupDevice;
337 dispatchTable[IRP_MJ_DEVICE_CONTROL] = OvsDeviceControl;
339 NdisInitUnicodeString(&deviceName, OVS_DEVICE_NAME_NT);
340 NdisInitUnicodeString(&symbolicDeviceName, OVS_DEVICE_NAME_DOS);
342 RtlZeroMemory(&deviceAttributes, sizeof (NDIS_DEVICE_OBJECT_ATTRIBUTES));
344 OVS_INIT_OBJECT_HEADER(&deviceAttributes.Header,
345 NDIS_OBJECT_TYPE_DEVICE_OBJECT_ATTRIBUTES,
346 NDIS_DEVICE_OBJECT_ATTRIBUTES_REVISION_1,
347 sizeof (NDIS_DEVICE_OBJECT_ATTRIBUTES));
349 deviceAttributes.DeviceName = &deviceName;
350 deviceAttributes.SymbolicName = &symbolicDeviceName;
351 deviceAttributes.MajorFunctions = dispatchTable;
352 deviceAttributes.ExtensionSize = sizeof (OVS_DEVICE_EXTENSION);
354 status = NdisRegisterDeviceEx(ovsExtDriverHandle,
/*
 * NOTE(review): the branch below is entered when registration did NOT
 * succeed, yet it fetches the device extension from gOvsDeviceObject and
 * asserts that the device object and handle are non-NULL. The condition
 * looks inverted (success would be the case where those globals are valid).
 * Confirm against the complete function before changing it.
 */
358 if (status != NDIS_STATUS_SUCCESS) {
359 POVS_DEVICE_EXTENSION ovsExt =
360 (POVS_DEVICE_EXTENSION)NdisGetDeviceReservedExtension(gOvsDeviceObject);
361 ASSERT(gOvsDeviceObject != NULL);
362 ASSERT(gOvsDeviceHandle != NULL);
365 ovsExt->numberOpenInstance = 0;
368 /* Initialize the associated data structures. */
371 OVS_LOG_TRACE("DeviceObject: %p", gOvsDeviceObject);
377 OvsDeleteDeviceObject()
379 if (gOvsDeviceHandle) {
381 POVS_DEVICE_EXTENSION ovsExt = (POVS_DEVICE_EXTENSION)
382 NdisGetDeviceReservedExtension(gOvsDeviceObject);
384 ASSERT(ovsExt->numberOpenInstance == 0);
388 ASSERT(gOvsDeviceObject);
389 NdisDeregisterDeviceEx(gOvsDeviceHandle);
390 gOvsDeviceHandle = NULL;
391 gOvsDeviceObject = NULL;
397 OvsGetOpenInstance(PFILE_OBJECT fileObject,
400 POVS_OPEN_INSTANCE instance = (POVS_OPEN_INSTANCE)fileObject->FsContext;
402 ASSERT(instance->fileObject == fileObject);
403 if (gOvsSwitchContext == NULL ||
404 gOvsSwitchContext->dpNo != dpNo) {
412 OvsFindOpenInstance(PFILE_OBJECT fileObject)
/*
 * Scans ovsOpenInstanceArray for the entry whose 'fileObject' matches the
 * argument and returns that entry when one is found.
 *
 * Slots can be empty (NULL), so each slot is tested before it is
 * dereferenced. 'j' bounds the scan by ovsNumberOfOpenInstances; presumably
 * it counts the occupied slots seen so far, but its increment is not visible
 * in this excerpt -- TODO confirm.
 */
415 for (i = 0, j = 0; i < OVS_MAX_OPEN_INSTANCES &&
416 j < ovsNumberOfOpenInstances; i++) {
417 if (ovsOpenInstanceArray[i]) {
418 if (ovsOpenInstanceArray[i]->fileObject == fileObject) {
419 return ovsOpenInstanceArray[i];
428 OvsAddOpenInstance(POVS_DEVICE_EXTENSION ovsExt,
429 PFILE_OBJECT fileObject)
/*
 * Creates the per-handle OVS_OPEN_INSTANCE for 'fileObject', stores it in the
 * first free slot of ovsOpenInstanceArray and links it to the file object
 * through FsContext.
 *
 * Returns STATUS_NO_MEMORY when the allocation fails,
 * STATUS_INSUFFICIENT_RESOURCES when OVS_MAX_OPEN_INSTANCES instances already
 * exist, and STATUS_SUCCESS otherwise.
 */
431 POVS_OPEN_INSTANCE instance =
432 (POVS_OPEN_INSTANCE) OvsAllocateMemory(sizeof (OVS_OPEN_INSTANCE));
435 if (instance == NULL) {
436 return STATUS_NO_MEMORY;
/* The allocation above is done before the control lock is taken. */
438 OvsAcquireCtrlLock();
439 ASSERT(OvsFindOpenInstance(fileObject) == NULL);
441 if (ovsNumberOfOpenInstances >= OVS_MAX_OPEN_INSTANCES) {
/* Table is full: drop the lock first, then release the unused allocation. */
442 OvsReleaseCtrlLock();
443 OvsFreeMemory(instance);
444 return STATUS_INSUFFICIENT_RESOURCES;
446 RtlZeroMemory(instance, sizeof (OVS_OPEN_INSTANCE));
448 for (i = 0; i < OVS_MAX_OPEN_INSTANCES; i++) {
449 if (ovsOpenInstanceArray[i] == NULL) {
450 ovsOpenInstanceArray[i] = instance;
/* The slot index is remembered so the entry can be cleared on removal. */
451 instance->cookie = i;
455 ASSERT(i < OVS_MAX_OPEN_INSTANCES);
456 instance->fileObject = fileObject;
457 ASSERT(fileObject->FsContext == NULL);
/*
 * The PID handed to this handle is the next value of the counter kept in the
 * device extension, incremented atomically.
 */
458 instance->pid = (UINT32)InterlockedIncrement((LONG volatile *)&ovsExt->pidCount);
459 if (instance->pid == 0) {
460 /* XXX: check for rollover. */
462 fileObject->FsContext = instance;
463 OvsReleaseCtrlLock();
464 return STATUS_SUCCESS;
468 OvsCleanupOpenInstance(PFILE_OBJECT fileObject)
470 POVS_OPEN_INSTANCE instance = (POVS_OPEN_INSTANCE)fileObject->FsContext;
472 ASSERT(fileObject == instance->fileObject);
473 OvsCleanupEvent(instance);
474 OvsCleanupPacketQueue(instance);
478 OvsRemoveOpenInstance(PFILE_OBJECT fileObject)
480 POVS_OPEN_INSTANCE instance;
481 ASSERT(fileObject->FsContext);
482 instance = (POVS_OPEN_INSTANCE)fileObject->FsContext;
483 ASSERT(instance->cookie < OVS_MAX_OPEN_INSTANCES);
485 OvsAcquireCtrlLock();
486 fileObject->FsContext = NULL;
487 ASSERT(ovsOpenInstanceArray[instance->cookie] == instance);
488 ovsOpenInstanceArray[instance->cookie] = NULL;
489 OvsReleaseCtrlLock();
490 ASSERT(instance->eventQueue == NULL);
491 ASSERT (instance->packetQueue == NULL);
492 OvsFreeMemory(instance);
496 OvsCompleteIrpRequest(PIRP irp,
500 irp->IoStatus.Information = infoPtr;
501 irp->IoStatus.Status = status;
502 IoCompleteRequest(irp, IO_NO_INCREMENT);
508 OvsOpenCloseDevice(PDEVICE_OBJECT deviceObject,
511 PIO_STACK_LOCATION irpSp;
512 NTSTATUS status = STATUS_SUCCESS;
513 PFILE_OBJECT fileObject;
514 POVS_DEVICE_EXTENSION ovsExt =
515 (POVS_DEVICE_EXTENSION)NdisGetDeviceReservedExtension(deviceObject);
517 ASSERT(deviceObject == gOvsDeviceObject);
518 ASSERT(ovsExt != NULL);
520 irpSp = IoGetCurrentIrpStackLocation(irp);
521 fileObject = irpSp->FileObject;
522 OVS_LOG_TRACE("DeviceObject: %p, fileObject:%p, instance: %u",
523 deviceObject, fileObject,
524 ovsExt->numberOpenInstance);
526 switch (irpSp->MajorFunction) {
528 status = OvsAddOpenInstance(ovsExt, fileObject);
529 if (STATUS_SUCCESS == status) {
530 InterlockedIncrement((LONG volatile *)&ovsExt->numberOpenInstance);
534 ASSERT(ovsExt->numberOpenInstance > 0);
535 OvsRemoveOpenInstance(fileObject);
536 InterlockedDecrement((LONG volatile *)&ovsExt->numberOpenInstance);
541 return OvsCompleteIrpRequest(irp, (ULONG_PTR)0, status);
544 _Use_decl_annotations_
546 OvsCleanupDevice(PDEVICE_OBJECT deviceObject,
550 PIO_STACK_LOCATION irpSp;
551 PFILE_OBJECT fileObject;
553 NTSTATUS status = STATUS_SUCCESS;
555 POVS_DEVICE_EXTENSION ovsExt =
556 (POVS_DEVICE_EXTENSION)NdisGetDeviceReservedExtension(deviceObject);
558 ASSERT(ovsExt->numberOpenInstance > 0);
561 UNREFERENCED_PARAMETER(deviceObject);
563 ASSERT(deviceObject == gOvsDeviceObject);
564 irpSp = IoGetCurrentIrpStackLocation(irp);
565 fileObject = irpSp->FileObject;
567 ASSERT(irpSp->MajorFunction == IRP_MJ_CLEANUP);
569 OvsCleanupOpenInstance(fileObject);
571 return OvsCompleteIrpRequest(irp, (ULONG_PTR)0, status);
576 * --------------------------------------------------------------------------
577 * IOCTL function handler for the device.
578 * --------------------------------------------------------------------------
581 OvsDeviceControl(PDEVICE_OBJECT deviceObject,
/*
 * Dispatch routine for IRP_MJ_DEVICE_CONTROL. The visible flow is:
 *   1. fetch the open instance from the file object's FsContext;
 *   2. refuse the request if the instance is already in use;
 *   3. per IOCTL code, check the buffers and derive 'ovsMsg' and 'devOp';
 *   4. select the netlink family from ovsMsg->nlMsg.nlmsgType;
 *   5. validate the command (skipped for OVS_READ_DEV_OP) and invoke its
 *      handler;
 *   6. complete the IRP with 'replyLen' and 'status'.
 */
585 PIO_STACK_LOCATION irpSp;
586 NTSTATUS status = STATUS_SUCCESS;
587 PFILE_OBJECT fileObject;
588 PVOID inputBuffer = NULL;
589 PVOID outputBuffer = NULL;
590 UINT32 inputBufferLen, outputBufferLen;
591 UINT32 code, replyLen = 0;
592 POVS_OPEN_INSTANCE instance;
594 OVS_MESSAGE ovsMsgReadOp;
596 NETLINK_FAMILY *nlFamilyOps;
597 OVS_USER_PARAMS_CONTEXT usrParamsCtx;
600 POVS_DEVICE_EXTENSION ovsExt =
601 (POVS_DEVICE_EXTENSION)NdisGetDeviceReservedExtension(deviceObject);
602 ASSERT(deviceObject == gOvsDeviceObject);
604 ASSERT(ovsExt->numberOpenInstance > 0);
606 UNREFERENCED_PARAMETER(deviceObject);
609 irpSp = IoGetCurrentIrpStackLocation(irp);
611 ASSERT(irpSp->MajorFunction == IRP_MJ_DEVICE_CONTROL);
612 ASSERT(irpSp->FileObject != NULL);
614 fileObject = irpSp->FileObject;
615 instance = (POVS_OPEN_INSTANCE)fileObject->FsContext;
616 code = irpSp->Parameters.DeviceIoControl.IoControlCode;
617 inputBufferLen = irpSp->Parameters.DeviceIoControl.InputBufferLength;
618 outputBufferLen = irpSp->Parameters.DeviceIoControl.OutputBufferLength;
619 inputBuffer = irp->AssociatedIrp.SystemBuffer;
621 /* Concurrent netlink operations are not supported. */
/*
 * 'inUse' is switched from 0 to 1 atomically; a non-zero previous value means
 * another request already holds this instance.
 */
622 if (InterlockedCompareExchange((LONG volatile *)&instance->inUse, 1, 0)) {
623 status = STATUS_RESOURCE_IN_USE;
628 * Validate the input/output buffer arguments depending on the type of the
632 case OVS_IOCTL_TRANSACT:
/* The message is taken directly from the caller's input buffer. */
633 /* Input buffer is mandatory, output buffer is optional. */
634 if (outputBufferLen != 0) {
635 status = MapIrpOutputBuffer(irp, outputBufferLen,
636 sizeof *ovsMsg, &outputBuffer);
637 if (status != STATUS_SUCCESS) {
640 ASSERT(outputBuffer);
643 if (inputBufferLen < sizeof (*ovsMsg)) {
644 status = STATUS_NDIS_INVALID_LENGTH;
648 ovsMsg = inputBuffer;
649 devOp = OVS_TRANSACTION_DEV_OP;
652 case OVS_IOCTL_READ_EVENT:
653 /* This IOCTL is used to read events */
654 if (outputBufferLen != 0) {
655 status = MapIrpOutputBuffer(irp, outputBufferLen,
656 sizeof *ovsMsg, &outputBuffer);
657 if (status != STATUS_SUCCESS) {
660 ASSERT(outputBuffer);
662 status = STATUS_NDIS_INVALID_LENGTH;
668 ovsMsg = &ovsMsgReadOp;
669 ovsMsg->nlMsg.nlmsgType = OVS_WIN_NL_CTRL_FAMILY_ID;
670 /* An "artificial" command so we can use NL family function table*/
671 ovsMsg->genlMsg.cmd = OVS_CTRL_CMD_EVENT_NOTIFY;
/*
 * NOTE(review): devOp is OVS_READ_DEV_OP here, whereas the table entry for
 * OVS_CTRL_CMD_EVENT_NOTIFY is tagged OVS_READ_EVENT_DEV_OP. Validation is
 * skipped for OVS_READ_DEV_OP further down, so the mismatch is never checked.
 * Confirm this is intended.
 */
672 devOp = OVS_READ_DEV_OP;
676 /* Output buffer is mandatory. */
677 if (outputBufferLen != 0) {
678 status = MapIrpOutputBuffer(irp, outputBufferLen,
679 sizeof *ovsMsg, &outputBuffer);
680 if (status != STATUS_SUCCESS) {
683 ASSERT(outputBuffer);
685 status = STATUS_NDIS_INVALID_LENGTH;
690 * Operate in the mode that read ioctl is similar to ReadFile(). This
691 * might change as the userspace code gets implemented.
697 * For implementing read (ioctl or otherwise), we need to store some
698 * state in the instance to indicate the command that started the dump
699 * operation. The state can setup 'ovsMsgReadOp' appropriately. Note
700 * that 'ovsMsgReadOp' is needed only in this function to call into the
701 * appropraite handler. The handler itself can access the state in the
704 * In the absence of a dump start, return 0 bytes.
706 if (instance->dumpState.ovsMsg == NULL) {
708 status = STATUS_SUCCESS;
711 RtlCopyMemory(&ovsMsgReadOp, instance->dumpState.ovsMsg,
712 sizeof (ovsMsgReadOp));
714 /* Create an NL message for consumption. */
715 ovsMsg = &ovsMsgReadOp;
716 devOp = OVS_READ_DEV_OP;
720 case OVS_IOCTL_WRITE:
721 /* Input buffer is mandatory. */
722 if (inputBufferLen < sizeof (*ovsMsg)) {
723 status = STATUS_NDIS_INVALID_LENGTH;
727 ovsMsg = inputBuffer;
728 devOp = OVS_WRITE_DEV_OP;
732 status = STATUS_INVALID_DEVICE_REQUEST;
737 switch (ovsMsg->nlMsg.nlmsgType) {
738 case OVS_WIN_NL_CTRL_FAMILY_ID:
739 nlFamilyOps = &nlControlFamilyOps;
741 case OVS_WIN_NL_DATAPATH_FAMILY_ID:
742 nlFamilyOps = &nlDatapathFamilyOps;
744 case OVS_WIN_NL_FLOW_FAMILY_ID:
745 nlFamilyOps = &nlFLowFamilyOps;
747 case OVS_WIN_NL_PACKET_FAMILY_ID:
/* The packet family has no command table yet, so its requests are rejected. */
748 status = STATUS_NOT_IMPLEMENTED;
750 case OVS_WIN_NL_VPORT_FAMILY_ID:
751 nlFamilyOps = &nlVportFamilyOps;
754 status = STATUS_INVALID_PARAMETER;
759 * For read operation, the netlink command has already been validated
762 if (devOp != OVS_READ_DEV_OP) {
/* Every operation other than a read is checked against the family's table. */
763 status = ValidateNetlinkCmd(devOp, instance, ovsMsg, nlFamilyOps);
764 if (status != STATUS_SUCCESS) {
769 InitUserParamsCtx(irp, instance, devOp, ovsMsg,
770 inputBuffer, inputBufferLen,
771 outputBuffer, outputBufferLen,
774 status = InvokeNetlinkCmdHandler(&usrParamsCtx, nlFamilyOps, &replyLen);
/* 'replyLen' and 'status' are handed to the IRP completion helper. */
779 return OvsCompleteIrpRequest(irp, (ULONG_PTR)replyLen, status);
784 * --------------------------------------------------------------------------
785 * Function to validate a netlink command. Only certain combinations of
786 * (device operation, netlink family, command) are valid.
787 * --------------------------------------------------------------------------
790 ValidateNetlinkCmd(UINT32 devOp,
791 POVS_OPEN_INSTANCE instance,
793 NETLINK_FAMILY *nlFamilyOps)
/*
 * Looks up the message's generic-netlink command in nlFamilyOps->cmds and,
 * for the matching entry, checks in order: the device operation, the family
 * version, the datapath index (only for commands that ask for it) and the
 * sender PID. 'status' starts as STATUS_INVALID_PARAMETER, which is also what
 * a command missing from the table yields; STATUS_SUCCESS is assigned after
 * the PID check.
 */
795 NTSTATUS status = STATUS_INVALID_PARAMETER;
798 for (i = 0; i < nlFamilyOps->opsCount; i++) {
799 if (nlFamilyOps->cmds[i].cmd == ovsMsg->genlMsg.cmd) {
800 /* Validate if the command is valid for the device operation. */
801 if ((devOp & nlFamilyOps->cmds[i].supportedDevOp) == 0) {
802 status = STATUS_INVALID_PARAMETER;
806 /* Validate the version. */
807 if (nlFamilyOps->version > ovsMsg->genlMsg.version) {
/* A message carrying a version lower than the family's version is rejected. */
808 status = STATUS_INVALID_PARAMETER;
812 /* Validate the DP for commands that require a DP. */
813 if (nlFamilyOps->cmds[i].validateDpIndex == TRUE) {
814 OvsAcquireCtrlLock();
/*
 * NOTE(review): gOvsSwitchContext is dereferenced below without a NULL check,
 * while other functions in this file test it for NULL before use. Confirm it
 * cannot be NULL on this path.
 */
815 if (ovsMsg->ovsHdr.dp_ifindex !=
816 (INT)gOvsSwitchContext->dpNo) {
817 status = STATUS_INVALID_PARAMETER;
818 OvsReleaseCtrlLock();
821 OvsReleaseCtrlLock();
824 /* Validate the PID. */
/* OVS_CTRL_CMD_WIN_GET_PID is exempt from the PID comparison. */
825 if (ovsMsg->genlMsg.cmd != OVS_CTRL_CMD_WIN_GET_PID) {
826 if (ovsMsg->nlMsg.nlmsgPid != instance->pid) {
827 status = STATUS_INVALID_PARAMETER;
832 status = STATUS_SUCCESS;
842 * --------------------------------------------------------------------------
843 * Function to invoke the netlink command handler.
844 * --------------------------------------------------------------------------
847 InvokeNetlinkCmdHandler(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
848 NETLINK_FAMILY *nlFamilyOps,
851 NTSTATUS status = STATUS_INVALID_PARAMETER;
854 for (i = 0; i < nlFamilyOps->opsCount; i++) {
855 if (nlFamilyOps->cmds[i].cmd == usrParamsCtx->ovsMsg->genlMsg.cmd) {
856 NetlinkCmdHandler *handler = nlFamilyOps->cmds[i].handler;
859 status = handler(usrParamsCtx, replyLen);
869 * --------------------------------------------------------------------------
870 * Command Handler for 'OVS_CTRL_CMD_WIN_GET_PID'.
872 * Each handle on the device is assigned a unique PID when the handle is
873 * created. On platforms that support netlink natively, the PID is available
874 * to userspace when the netlink socket is created. However, without native
875 * netlink support on Windows, OVS datapath generates the PID and lets the
876 * userspace query it.
878 * This function implements the query.
879 * --------------------------------------------------------------------------
882 OvsGetPidCmdHandler(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
/*
 * Writes a zeroed OVS_MESSAGE into the output buffer carrying the request's
 * sequence number and the PID stored in the open instance, and reports
 * sizeof(OVS_MESSAGE) through 'replyLen'. The reply is produced only when
 * the output buffer can hold a whole OVS_MESSAGE; STATUS_NDIS_INVALID_LENGTH
 * is the other visible outcome.
 */
885 POVS_MESSAGE msgIn = (POVS_MESSAGE)usrParamsCtx->inputBuffer;
886 POVS_MESSAGE msgOut = (POVS_MESSAGE)usrParamsCtx->outputBuffer;
888 if (usrParamsCtx->outputLength >= sizeof *msgOut) {
889 POVS_OPEN_INSTANCE instance =
890 (POVS_OPEN_INSTANCE)usrParamsCtx->ovsInstance;
/* All reply fields other than the two set below remain zero. */
892 RtlZeroMemory(msgOut, sizeof *msgOut);
893 msgOut->nlMsg.nlmsgSeq = msgIn->nlMsg.nlmsgSeq;
894 msgOut->nlMsg.nlmsgPid = instance->pid;
895 *replyLen = sizeof *msgOut;
896 /* XXX: We might need to return the DP index as well. */
898 return STATUS_NDIS_INVALID_LENGTH;
901 return STATUS_SUCCESS;
905 * --------------------------------------------------------------------------
906 * Utility function to fill up information about the datapath in a reply to
908 * Assumes that 'gOvsCtrlLock' lock is acquired.
909 * --------------------------------------------------------------------------
912 OvsDpFillInfo(POVS_SWITCH_CONTEXT ovsSwitchContext,
/*
 * Serializes a datapath reply into 'nlBuf': a message header built in
 * 'msgOutTmp', a name attribute (OVS_DP_ATTR_NAME) and a statistics
 * attribute (OVS_DP_ATTR_STATS) taken from the switch context's datapath
 * counters. Returns STATUS_SUCCESS when the final 'writeOk' is true and
 * STATUS_INVALID_BUFFER_SIZE otherwise.
 *
 * 'ovsSwitchContext' is dereferenced unconditionally, so callers must pass a
 * non-NULL context.
 */
917 OVS_MESSAGE msgOutTmp;
918 OVS_DATAPATH *datapath = &ovsSwitchContext->datapath;
921 /* XXX: Add API for nlBuf->bufRemLen. */
922 ASSERT(NlBufAt(nlBuf, 0, 0) != 0 && nlBuf->bufRemLen >= sizeof *msgIn);
/* Sequence number and PID are echoed from the request. */
924 msgOutTmp.nlMsg.nlmsgType = OVS_WIN_NL_DATAPATH_FAMILY_ID;
925 msgOutTmp.nlMsg.nlmsgFlags = 0; /* XXX: ? */
926 msgOutTmp.nlMsg.nlmsgSeq = msgIn->nlMsg.nlmsgSeq;
927 msgOutTmp.nlMsg.nlmsgPid = msgIn->nlMsg.nlmsgPid;
/* The reply is always labelled OVS_DP_CMD_GET, whatever the request command. */
929 msgOutTmp.genlMsg.cmd = OVS_DP_CMD_GET;
930 msgOutTmp.genlMsg.version = nlDatapathFamilyOps.version;
931 msgOutTmp.genlMsg.reserved = 0;
933 msgOutTmp.ovsHdr.dp_ifindex = ovsSwitchContext->dpNo;
/*
 * 'writeOk' is reassigned by each put call below; presumably the later calls
 * are guarded by the earlier result on lines not visible here -- TODO confirm.
 */
935 writeOk = NlMsgPutHead(nlBuf, (PCHAR)&msgOutTmp, sizeof msgOutTmp);
937 writeOk = NlMsgPutTailString(nlBuf, OVS_DP_ATTR_NAME,
941 OVS_DP_STATS dpStats;
943 dpStats.n_hit = datapath->hits;
944 dpStats.n_missed = datapath->misses;
945 dpStats.n_lost = datapath->lost;
946 dpStats.n_flows = datapath->nFlows;
947 writeOk = NlMsgPutTailUnspec(nlBuf, OVS_DP_ATTR_STATS,
948 (PCHAR)&dpStats, sizeof dpStats);
/*
 * nlmsgLen is not set in 'msgOutTmp'; it is patched in the buffer here, once
 * the attributes have been appended, from the buffer's current size.
 */
950 nlMsg = (PNL_MSG_HDR)NlBufAt(nlBuf, 0, 0);
951 nlMsg->nlmsgLen = NlBufSize(nlBuf);
953 return writeOk ? STATUS_SUCCESS : STATUS_INVALID_BUFFER_SIZE;
957 * --------------------------------------------------------------------------
958 * Handler for queueing an IRP used for event notification. The IRP is
959 * completed when a port state changes. STATUS_PENDING is returned on
960 * success. User mode keeps a pending IRP at all times.
961 * --------------------------------------------------------------------------
964 OvsPendEventCmdHandler(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
969 UNREFERENCED_PARAMETER(replyLen);
971 POVS_OPEN_INSTANCE instance =
972 (POVS_OPEN_INSTANCE)usrParamsCtx->ovsInstance;
973 POVS_MESSAGE msgIn = (POVS_MESSAGE)usrParamsCtx->inputBuffer;
976 poll.dpNo = msgIn->ovsHdr.dp_ifindex;
977 status = OvsWaitEventIoctl(usrParamsCtx->irp, instance->fileObject,
984 * --------------------------------------------------------------------------
985 * Handler for the subscription for the event queue
986 * --------------------------------------------------------------------------
989 OvsSubscribeEventCmdHandler(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
993 OVS_EVENT_SUBSCRIBE request;
997 const NL_POLICY policy[] = {
998 [OVS_NL_ATTR_MCAST_GRP] = {.type = NL_A_U32 },
999 [OVS_NL_ATTR_MCAST_JOIN] = {.type = NL_A_U8 },
1002 UNREFERENCED_PARAMETER(replyLen);
1004 POVS_OPEN_INSTANCE instance =
1005 (POVS_OPEN_INSTANCE)usrParamsCtx->ovsInstance;
1006 POVS_MESSAGE msgIn = (POVS_MESSAGE)usrParamsCtx->inputBuffer;
1008 rc = NlAttrParse(&msgIn->nlMsg, sizeof (*msgIn),
1009 NlMsgAttrsLen((PNL_MSG_HDR)msgIn), policy, attrs, 2);
1011 status = STATUS_INVALID_PARAMETER;
1015 /* XXX Ignore the MC group for now */
1016 join = NlAttrGetU8(attrs[OVS_NL_ATTR_MCAST_JOIN]);
1017 request.dpNo = msgIn->ovsHdr.dp_ifindex;
1018 request.subscribe = join;
1019 request.mask = OVS_EVENT_MASK_ALL;
1021 status = OvsSubscribeEventIoctl(instance->fileObject, &request,
1029 * --------------------------------------------------------------------------
1030 * Command Handler for 'OVS_DP_CMD_GET'.
1032 * The function handles both the dump based as well as the transaction based
1033 * 'OVS_DP_CMD_GET' command. In the dump command, it handles the initial
1034 * call to setup dump state, as well as subsequent calls to continue dumping
1036 * --------------------------------------------------------------------------
1039 OvsGetDpCmdHandler(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
1042 if (usrParamsCtx->devOp == OVS_TRANSACTION_DEV_OP) {
1043 return HandleGetDpTransaction(usrParamsCtx, replyLen);
1045 return HandleGetDpDump(usrParamsCtx, replyLen);
1050 * --------------------------------------------------------------------------
1051 * Function for handling the transaction based 'OVS_DP_CMD_GET' command.
1052 * --------------------------------------------------------------------------
1055 HandleGetDpTransaction(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
1058 return HandleDpTransaction(usrParamsCtx, replyLen);
1063 * --------------------------------------------------------------------------
1064 * Function for handling the dump-based 'OVS_DP_CMD_GET' command.
1065 * --------------------------------------------------------------------------
1068 HandleGetDpDump(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
/*
 * Dump flavour of OVS_DP_CMD_GET. A write operation sets up the dump state;
 * a read operation emits the datapath information built from the saved
 * request and then frees the dump state, since there is no more data to
 * continue with.
 */
1071 POVS_MESSAGE msgOut = (POVS_MESSAGE)usrParamsCtx->outputBuffer;
1072 POVS_OPEN_INSTANCE instance =
1073 (POVS_OPEN_INSTANCE)usrParamsCtx->ovsInstance;
1075 if (usrParamsCtx->devOp == OVS_WRITE_DEV_OP) {
/*
 * NOTE(review): the NTSTATUS returned by OvsSetupDumpStart() appears to be
 * discarded here, so a write without NLM_F_DUMP, or a failure from
 * InitUserDumpState(), would not be reported to the caller. Confirm against
 * the complete function.
 */
1077 OvsSetupDumpStart(usrParamsCtx);
/* The request saved at dump start stands in for the input message on a read. */
1081 POVS_MESSAGE msgIn = instance->dumpState.ovsMsg;
1083 ASSERT(usrParamsCtx->devOp == OVS_READ_DEV_OP);
1085 if (instance->dumpState.ovsMsg == NULL) {
1087 return STATUS_INVALID_DEVICE_STATE;
1090 /* Dump state must have been deleted after previous dump operation. */
1091 ASSERT(instance->dumpState.index[0] == 0);
1092 /* Output buffer has been validated while validating read dev op. */
1093 ASSERT(msgOut != NULL && usrParamsCtx->outputLength >= sizeof *msgOut);
1095 NlBufInit(&nlBuf, usrParamsCtx->outputBuffer,
1096 usrParamsCtx->outputLength);
/* The switch context is examined and serialized under the control lock. */
1098 OvsAcquireCtrlLock();
1099 if (!gOvsSwitchContext) {
1100 /* Treat this as a dump done. */
1101 OvsReleaseCtrlLock();
1103 FreeUserDumpState(instance);
1104 return STATUS_SUCCESS;
1106 status = OvsDpFillInfo(gOvsSwitchContext, msgIn, &nlBuf);
1107 OvsReleaseCtrlLock();
1109 if (status != STATUS_SUCCESS) {
1111 FreeUserDumpState(instance);
1115 /* Increment the dump index. */
1116 instance->dumpState.index[0] = 1;
/* The reply length is read back from the header written into the output buffer. */
1117 *replyLen = msgOut->nlMsg.nlmsgLen;
1119 /* Free up the dump state, since there's no more data to continue. */
1120 FreeUserDumpState(instance);
1123 return STATUS_SUCCESS;
1128 * --------------------------------------------------------------------------
1129 * Command Handler for 'OVS_DP_CMD_SET'.
1130 * --------------------------------------------------------------------------
1133 OvsSetDpCmdHandler(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
1136 return HandleDpTransaction(usrParamsCtx, replyLen);
1140 * --------------------------------------------------------------------------
1141 * Function for handling transaction based 'OVS_DP_CMD_GET' and
1142 * 'OVS_DP_CMD_SET' commands.
1143 * --------------------------------------------------------------------------
1146 HandleDpTransaction(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
/*
 * Shared implementation of the transaction-based OVS_DP_CMD_GET and
 * OVS_DP_CMD_SET commands. Attributes are parsed only for OVS_DP_CMD_SET.
 * The datapath is then identified either by name (when a name attribute was
 * parsed) or by the dp_ifindex in the request header, and its information is
 * written into the output buffer under the control lock. 'replyLen' receives
 * the size of the netlink buffer.
 */
1149 POVS_MESSAGE msgIn = (POVS_MESSAGE)usrParamsCtx->inputBuffer;
1150 POVS_MESSAGE msgOut = (POVS_MESSAGE)usrParamsCtx->outputBuffer;
1151 NTSTATUS status = STATUS_SUCCESS;
1153 static const NL_POLICY ovsDatapathSetPolicy[] = {
1154 [OVS_DP_ATTR_NAME] = { .type = NL_A_STRING, .maxLen = IFNAMSIZ },
1155 [OVS_DP_ATTR_UPCALL_PID] = { .type = NL_A_U32, .optional = TRUE },
1156 [OVS_DP_ATTR_USER_FEATURES] = { .type = NL_A_U32, .optional = TRUE },
1158 PNL_ATTR dpAttrs[ARRAY_SIZE(ovsDatapathSetPolicy)];
1160 /* input buffer has been validated while validating write dev op. */
1161 ASSERT(msgIn != NULL && usrParamsCtx->inputLength >= sizeof *msgIn);
1163 /* Parse any attributes in the request. */
1164 if (usrParamsCtx->ovsMsg->genlMsg.cmd == OVS_DP_CMD_SET) {
1165 if (!NlAttrParse((PNL_MSG_HDR)msgIn,
1166 NLMSG_HDRLEN + GENL_HDRLEN + OVS_HDRLEN,
1167 NlMsgAttrsLen((PNL_MSG_HDR)msgIn),
1168 ovsDatapathSetPolicy, dpAttrs, ARRAY_SIZE(dpAttrs))) {
1169 return STATUS_INVALID_PARAMETER;
1173 * XXX: Not clear at this stage if there's any role for the
1174 * OVS_DP_ATTR_UPCALL_PID and OVS_DP_ATTR_USER_FEATURES attributes passed
1179 RtlZeroMemory(dpAttrs, sizeof dpAttrs);
1182 /* Output buffer is optional for OVS_TRANSACTION_DEV_OP. */
1183 if (msgOut == NULL || usrParamsCtx->outputLength < sizeof *msgOut) {
/*
 * NOTE(review): although the comment above calls the output buffer optional,
 * this handler rejects a request whose output buffer is missing or smaller
 * than an OVS_MESSAGE.
 */
1184 return STATUS_NDIS_INVALID_LENGTH;
1186 NlBufInit(&nlBuf, usrParamsCtx->outputBuffer, usrParamsCtx->outputLength);
1188 OvsAcquireCtrlLock();
1189 if (dpAttrs[OVS_DP_ATTR_NAME] != NULL) {
/*
 * NOTE(review): with '&&', STATUS_NOT_FOUND is returned only when there is no
 * switch context AND the name comparison fails (OvsCompareString() presumably
 * returns non-zero on a match). If the context is NULL but the name matches,
 * control appears to reach OvsDpFillInfo() with a NULL context, which it
 * dereferences; if a context exists, any name is accepted. '||' may have been
 * intended -- confirm against the complete function.
 */
1190 if (!gOvsSwitchContext &&
1191 !OvsCompareString(NlAttrGet(dpAttrs[OVS_DP_ATTR_NAME]),
1192 OVS_SYSTEM_DP_NAME)) {
1193 OvsReleaseCtrlLock();
1194 status = STATUS_NOT_FOUND;
1197 } else if ((UINT32)msgIn->ovsHdr.dp_ifindex != gOvsSwitchContext->dpNo) {
/*
 * NOTE(review): the condition above dereferences gOvsSwitchContext without a
 * NULL check -- confirm it cannot be NULL when no name attribute is present.
 */
1198 OvsReleaseCtrlLock();
1199 status = STATUS_NOT_FOUND;
1203 status = OvsDpFillInfo(gOvsSwitchContext, msgIn, &nlBuf);
1204 OvsReleaseCtrlLock();
1206 *replyLen = NlBufSize(&nlBuf);
1214 OvsSetupDumpStart(POVS_USER_PARAMS_CONTEXT usrParamsCtx)
1216 POVS_MESSAGE msgIn = (POVS_MESSAGE)usrParamsCtx->inputBuffer;
1217 POVS_OPEN_INSTANCE instance =
1218 (POVS_OPEN_INSTANCE)usrParamsCtx->ovsInstance;
1220 /* input buffer has been validated while validating write dev op. */
1221 ASSERT(msgIn != NULL && usrParamsCtx->inputLength >= sizeof *msgIn);
1223 /* A write operation that does not indicate dump start is invalid. */
1224 if ((msgIn->nlMsg.nlmsgFlags & NLM_F_DUMP) != NLM_F_DUMP) {
1225 return STATUS_INVALID_PARAMETER;
1227 /* XXX: Handle other NLM_F_* flags in the future. */
1230 * This operation should be setting up the dump state. If there's any
1231 * previous state, clear it up so as to set it up afresh.
1233 if (instance->dumpState.ovsMsg != NULL) {
1234 FreeUserDumpState(instance);
1237 return InitUserDumpState(instance, msgIn);
1241 BuildMsgOut(POVS_MESSAGE msgIn, POVS_MESSAGE msgOut, UINT16 type,
1242 UINT32 length, UINT16 flags)
1244 msgOut->nlMsg.nlmsgType = type;
1245 msgOut->nlMsg.nlmsgFlags = flags;
1246 msgOut->nlMsg.nlmsgSeq = msgIn->nlMsg.nlmsgSeq;
1247 msgOut->nlMsg.nlmsgPid = msgIn->nlMsg.nlmsgPid;
1248 msgOut->nlMsg.nlmsgLen = length;
1250 msgOut->genlMsg.cmd = msgIn->genlMsg.cmd;
1251 msgOut->genlMsg.version = nlDatapathFamilyOps.version;
1252 msgOut->genlMsg.reserved = 0;
1256 BuildReplyMsgFromMsgIn(POVS_MESSAGE msgIn, POVS_MESSAGE msgOut, UINT16 flags)
1258 BuildMsgOut(msgIn, msgOut, msgIn->nlMsg.nlmsgType, sizeof(OVS_MESSAGE),
1263 BuildErrorMsg(POVS_MESSAGE msgIn, POVS_MESSAGE_ERROR msgOut, UINT errorCode)
1265 BuildMsgOut(msgIn, (POVS_MESSAGE)msgOut, NLMSG_ERROR,
1266 sizeof(OVS_MESSAGE_ERROR), 0);
1268 msgOut->errorMsg.error = errorCode;
1269 msgOut->errorMsg.nlMsg = msgIn->nlMsg;
/*
 * OvsCreateMsgFromVport: serialises 'vport' into a netlink reply written to
 * 'outBuffer' (capacity 'outBufLen').
 *
 * The reply headers are derived from 'msgIn' with NLM_F_MULTI set and
 * dp_ifindex set to 'dpIfIndex'. They are followed by the PORT_NO, TYPE,
 * NAME, UPCALL_PID and STATS attributes. Before returning STATUS_SUCCESS the
 * nlmsgLen field at the start of the buffer is patched to the number of
 * bytes used in the buffer.
 *
 * NOTE(review): the checks guarding the STATUS_INSUFFICIENT_RESOURCES returns
 * are not visible in this listing; presumably each one fires when the
 * preceding put call reports failure through 'ok' -- confirm.
 */
1273 OvsCreateMsgFromVport(POVS_VPORT_ENTRY vport,
1280 OVS_VPORT_FULL_STATS vportStats;
1285 NlBufInit(&nlBuffer, outBuffer, outBufLen);
/* Reply headers: copied from the request, flagged as part of a multi-part
 * reply. */
1287 BuildReplyMsgFromMsgIn(msgIn, &msgOut, NLM_F_MULTI);
1288 msgOut.ovsHdr.dp_ifindex = dpIfIndex;
1290 ok = NlMsgPutHead(&nlBuffer, (PCHAR)&msgOut, sizeof msgOut);
1292 return STATUS_INSUFFICIENT_RESOURCES;
/* Identification attributes of the port. */
1295 ok = NlMsgPutTailU32(&nlBuffer, OVS_VPORT_ATTR_PORT_NO, vport->portNo);
1297 return STATUS_INSUFFICIENT_RESOURCES;
1300 ok = NlMsgPutTailU32(&nlBuffer, OVS_VPORT_ATTR_TYPE, vport->ovsType);
1302 return STATUS_INSUFFICIENT_RESOURCES;
1305 ok = NlMsgPutTailString(&nlBuffer, OVS_VPORT_ATTR_NAME, vport->ovsName);
1307 return STATUS_INSUFFICIENT_RESOURCES;
1311 * XXX: when we implement OVS_DP_ATTR_USER_FEATURES in datapath,
1312 * we'll need to check the OVS_DP_F_VPORT_PIDS flag: if it is set,
1313 * it means we have an array of pids, instead of a single pid.
1314 * ATM we assume we have one pid only.
1317 ok = NlMsgPutTailU32(&nlBuffer, OVS_VPORT_ATTR_UPCALL_PID,
1320 return STATUS_INSUFFICIENT_RESOURCES;
/* Statistics: packet/byte counters come from vport->stats, error/drop
 * counters from vport->errStats. */
1324 vportStats.rxPackets = vport->stats.rxPackets;
1325 vportStats.rxBytes = vport->stats.rxBytes;
1326 vportStats.txPackets = vport->stats.txPackets;
1327 vportStats.txBytes = vport->stats.txBytes;
1328 vportStats.rxErrors = vport->errStats.rxErrors;
1329 vportStats.txErrors = vport->errStats.txErrors;
1330 vportStats.rxDropped = vport->errStats.rxDropped;
1331 vportStats.txDropped = vport->errStats.txDropped;
1333 ok = NlMsgPutTailUnspec(&nlBuffer, OVS_VPORT_ATTR_STATS,
1335 sizeof(OVS_VPORT_FULL_STATS));
1337 return STATUS_INSUFFICIENT_RESOURCES;
1341 * XXX: when vxlan udp dest port becomes configurable, we will also need
1342 * to add vport options
/* Patch the final message length into the header at offset 0. */
1345 nlMsg = (PNL_MSG_HDR)NlBufAt(&nlBuffer, 0, 0);
1346 nlMsg->nlmsgLen = NlBufSize(&nlBuffer);
1348 return STATUS_SUCCESS;
/*
 * OvsGetVportDumpNext: produces the next reply of an in-progress vport dump
 * (read device operation).
 *
 * The dump must have been set up beforehand (dumpState.ovsMsg non-NULL);
 * otherwise STATUS_INVALID_DEVICE_STATE is returned. The resume position is
 * kept in the instance: dumpState.index[0] is the hash bucket and
 * dumpState.index[1] the position inside that bucket. Starting there, the
 * port hash array is scanned for a vport whose portNo is non-zero; that vport
 * is serialised into the output buffer and the position is saved again.
 *
 * When no switch context exists, or no further vport is found, the dump
 * state is freed and STATUS_SUCCESS is returned (dump done).
 */
1352 OvsGetVportDumpNext(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
1356 POVS_OPEN_INSTANCE instance =
1357 (POVS_OPEN_INSTANCE)usrParamsCtx->ovsInstance;
1358 LOCK_STATE_EX lockState;
/* 'i' doubles as the "found" indicator checked after the scan: it keeps this
 * initial value when the scan below is not entered. */
1359 UINT32 i = OVS_MAX_VPORT_ARRAY_SIZE;
1362 * XXX: this function shares some code with other dump command(s).
1363 * In the future, we will need to refactor the dump functions
1366 ASSERT(usrParamsCtx->devOp == OVS_READ_DEV_OP);
1368 if (instance->dumpState.ovsMsg == NULL) {
1370 return STATUS_INVALID_DEVICE_STATE;
1373 /* Output buffer has been validated while validating read dev op. */
1374 ASSERT(usrParamsCtx->outputBuffer != NULL);
/* The request saved at dump start is the template for every reply. */
1376 msgIn = instance->dumpState.ovsMsg;
1378 OvsAcquireCtrlLock();
1379 if (!gOvsSwitchContext) {
1380 /* Treat this as a dump done. */
1381 OvsReleaseCtrlLock();
1383 FreeUserDumpState(instance);
1384 return STATUS_SUCCESS;
1388 * XXX: when we implement OVS_DP_ATTR_USER_FEATURES in datapath,
1389 * we'll need to check the OVS_DP_F_VPORT_PIDS flag: if it is set,
1390 * it means we have an array of pids, instead of a single pid.
1391 * ATM we assume we have one pid only.
1394 NdisAcquireRWLockRead(gOvsSwitchContext->dispatchLock, &lockState, 0);
1396 if (gOvsSwitchContext->numVports > 0) {
1397 /* inBucket: the bucket, used for lookup */
1398 UINT32 inBucket = instance->dumpState.index[0];
1399 /* inIndex: index within the given bucket, used for lookup */
1400 UINT32 inIndex = instance->dumpState.index[1];
1401 /* the bucket to be used for the next dump operation */
1402 UINT32 outBucket = 0;
1403 /* the index within the outBucket to be used for the next dump */
1404 UINT32 outIndex = 0;
1406 for (i = inBucket; i < OVS_MAX_VPORT_ARRAY_SIZE; i++) {
1407 PLIST_ENTRY head, link;
1408 head = &(gOvsSwitchContext->portHashArray[i]);
1409 POVS_VPORT_ENTRY vport = NULL;
1412 LIST_FORALL(head, link) {
1415 * if one or more dumps were previously done on this same bucket,
1416 * inIndex will be > 0, so we'll need to reply with the
1417 * inIndex + 1 vport from the bucket.
1419 if (outIndex >= inIndex) {
1420 vport = CONTAINING_RECORD(link, OVS_VPORT_ENTRY, portLink);
1422 if (vport->portNo != 0) {
/* NOTE(review): the status returned by OvsCreateMsgFromVport() is not
 * captured here, so a failed serialisation is not reported and the nlmsgLen
 * read from the output buffer further down may not be valid -- confirm and
 * propagate the status. */
1423 OvsCreateMsgFromVport(vport, msgIn,
1424 usrParamsCtx->outputBuffer,
1425 usrParamsCtx->outputLength,
1426 gOvsSwitchContext->dpNo);
1442 * if no vport was found above, check the next bucket, beginning
1443 * with the first (i.e. index 0) elem from within that bucket
1450 /* XXX: what about NLMSG_DONE (as msg type)? */
/* Remember where the next read has to resume. */
1451 instance->dumpState.index[0] = outBucket;
1452 instance->dumpState.index[1] = outIndex;
1455 NdisReleaseRWLock(gOvsSwitchContext->dispatchLock, &lockState);
1457 OvsReleaseCtrlLock();
1459 /* if i < OVS_MAX_VPORT_ARRAY_SIZE => vport was found */
1460 if (i < OVS_MAX_VPORT_ARRAY_SIZE) {
/* The reply length is read back from the header written into the output
 * buffer. */
1461 POVS_MESSAGE msgOut = (POVS_MESSAGE)usrParamsCtx->outputBuffer;
1462 *replyLen = msgOut->nlMsg.nlmsgLen;
1465 * if i >= OVS_MAX_VPORT_ARRAY_SIZE => vport was not found =>
1469 /* Free up the dump state, since there's no more data to continue. */
1470 FreeUserDumpState(instance);
1473 return STATUS_SUCCESS;
/*
 * OvsGetVport: answers a single "get vport" request (transaction device
 * operation).
 *
 * The vport is looked up by OVS_VPORT_ATTR_NAME when that attribute is
 * present, otherwise by OVS_VPORT_ATTR_PORT_NO. The vport is serialised into
 * the output buffer and '*replyLen' is set to the length of that message.
 * When 'nlError' has been set (NL_ERROR_INVAL or NL_ERROR_NODEV) a netlink
 * error message is written to the output buffer instead and '*replyLen' is
 * its length; the function still returns STATUS_SUCCESS in that case.
 *
 * Returns STATUS_INVALID_PARAMETER when the attributes cannot be parsed or
 * no switch context exists, and STATUS_INVALID_BUFFER_SIZE when the output
 * buffer is missing or smaller than an OVS_MESSAGE.
 */
1477 OvsGetVport(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
1480 NTSTATUS status = STATUS_SUCCESS;
1481 LOCK_STATE_EX lockState;
1483 POVS_MESSAGE msgIn = (POVS_MESSAGE)usrParamsCtx->inputBuffer;
1484 POVS_MESSAGE msgOut = (POVS_MESSAGE)usrParamsCtx->outputBuffer;
1485 POVS_VPORT_ENTRY vport = NULL;
1486 NL_ERROR nlError = NL_ERROR_SUCCESS;
1488 static const NL_POLICY ovsVportPolicy[] = {
1489 [OVS_VPORT_ATTR_PORT_NO] = { .type = NL_A_U32, .optional = TRUE },
1490 [OVS_VPORT_ATTR_NAME] = { .type = NL_A_STRING,
1495 PNL_ATTR vportAttrs[ARRAY_SIZE(ovsVportPolicy)];
1497 /* input buffer has been validated while validating write dev op. */
1498 ASSERT(usrParamsCtx->inputBuffer != NULL);
/* NOTE(review): this call passes five arguments, while the NlAttrParse()
 * call in the datapath handler earlier in this file passes an additional
 * NlMsgAttrsLen((PNL_MSG_HDR)msgIn) after the offset. One of the two does
 * not match the prototype -- confirm and align. */
1500 if (!NlAttrParse((PNL_MSG_HDR)msgIn,
1501 NLMSG_HDRLEN + GENL_HDRLEN + OVS_HDRLEN,
1502 ovsVportPolicy, vportAttrs, ARRAY_SIZE(vportAttrs))) {
1503 return STATUS_INVALID_PARAMETER;
1506 if (msgOut == NULL || usrParamsCtx->outputLength < sizeof *msgOut) {
1507 return STATUS_INVALID_BUFFER_SIZE;
/* NOTE(review): the control lock only covers the NULL check; it is released
 * before gOvsSwitchContext is used for the lookups and the serialisation
 * below -- confirm nothing can tear the context down in between. */
1510 OvsAcquireCtrlLock();
1511 if (!gOvsSwitchContext) {
1512 OvsReleaseCtrlLock();
1513 return STATUS_INVALID_PARAMETER;
1515 OvsReleaseCtrlLock();
/* Lookup by name takes precedence over lookup by port number. The name
 * length passed on is the attribute size minus one. */
1517 if (vportAttrs[OVS_VPORT_ATTR_NAME] != NULL) {
1518 vport = OvsFindVportByOvsName(gOvsSwitchContext,
1519 NlAttrGet(vportAttrs[OVS_VPORT_ATTR_NAME]),
1520 NlAttrGetSize(vportAttrs[OVS_VPORT_ATTR_NAME]) - 1);
1521 } else if (vportAttrs[OVS_VPORT_ATTR_PORT_NO] != NULL) {
1522 vport = OvsFindVportByPortNo(gOvsSwitchContext,
1523 NlAttrGetU32(vportAttrs[OVS_VPORT_ATTR_PORT_NO]));
1525 nlError = NL_ERROR_INVAL;
1530 nlError = NL_ERROR_NODEV;
/* NOTE(review): 'status' is assigned here but the function ends with an
 * unconditional STATUS_SUCCESS, so a serialisation failure appears to go
 * unreported and nlmsgLen is read regardless -- confirm. */
1534 NdisAcquireRWLockRead(gOvsSwitchContext->dispatchLock, &lockState, 0);
1535 status = OvsCreateMsgFromVport(vport, msgIn, usrParamsCtx->outputBuffer,
1536 usrParamsCtx->outputLength,
1537 gOvsSwitchContext->dpNo);
1538 NdisReleaseRWLock(gOvsSwitchContext->dispatchLock, &lockState);
1540 *replyLen = msgOut->nlMsg.nlmsgLen;
/* Failures are reported in-band: the output buffer is overwritten with a
 * netlink error message. */
1543 if (nlError != NL_ERROR_SUCCESS) {
1544 POVS_MESSAGE_ERROR msgError = (POVS_MESSAGE_ERROR)
1545 usrParamsCtx->outputBuffer;
1547 BuildErrorMsg(msgIn, msgError, nlError);
1548 *replyLen = msgError->nlMsg.nlmsgLen;
1551 return STATUS_SUCCESS;
1555 * --------------------------------------------------------------------------
1556 * Handler for the get vport command. The function handles the initial call to
1557 * setup the dump state, as well as subsequent calls to continue dumping data.
1558 * --------------------------------------------------------------------------
/*
 * Dispatches on the device operation of the request; each case returns the
 * status of the function it delegates to.
 */
1561 OvsGetVportCmdHandler(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
1566 switch (usrParamsCtx->devOp)
/* Write: (re)initialise the dump state of the instance. */
1568 case OVS_WRITE_DEV_OP:
1569 return OvsSetupDumpStart(usrParamsCtx);
/* Read: emit the next vport of the dump in progress. */
1571 case OVS_READ_DEV_OP:
1572 return OvsGetVportDumpNext(usrParamsCtx, replyLen);
/* Transaction: look up and return a single vport. */
1574 case OVS_TRANSACTION_DEV_OP:
1575 return OvsGetVport(usrParamsCtx, replyLen);
/* Presumably the default case: any other device operation is rejected. */
1578 return STATUS_INVALID_DEVICE_REQUEST;
1584 * --------------------------------------------------------------------------
1585 * Utility function to map the output buffer in an IRP. The buffer is assumed
1586 * to have been passed down using METHOD_OUT_DIRECT (Direct I/O).
1587 * --------------------------------------------------------------------------
/*
 * Stores in '*buffer' the system address obtained for the MDL of 'irp'.
 *
 * Returns:
 *   STATUS_SUCCESS                 '*buffer' holds the mapped address.
 *   STATUS_INVALID_PARAMETER       'buffer' or 'irp' is NULL, a length is 0,
 *                                  or the IRP carries no MDL.
 *   STATUS_NDIS_INVALID_LENGTH     'bufferLength' < 'requiredLength'.
 *   STATUS_INSUFFICIENT_RESOURCES  the MDL could not be mapped.
 */
1590 MapIrpOutputBuffer(PIRP irp,
1591 UINT32 bufferLength,
1592 UINT32 requiredLength,
1597 ASSERT(bufferLength);
1598 ASSERT(requiredLength);
/* The same conditions are checked again at run time, in addition to the
 * assertions above. */
1599 if (!buffer || !irp || bufferLength == 0 || requiredLength == 0) {
1600 return STATUS_INVALID_PARAMETER;
/* The caller's buffer must be able to hold what is going to be written. */
1603 if (bufferLength < requiredLength) {
1604 return STATUS_NDIS_INVALID_LENGTH;
/* Without an MDL there is nothing to map. */
1606 if (irp->MdlAddress == NULL) {
1607 return STATUS_INVALID_PARAMETER;
/* The "Safe" variant reports a mapping failure by returning NULL, which is
 * checked right below. */
1609 *buffer = MmGetSystemAddressForMdlSafe(irp->MdlAddress,
1610 NormalPagePriority);
1611 if (*buffer == NULL) {
1612 return STATUS_INSUFFICIENT_RESOURCES;
1615 return STATUS_SUCCESS;
1619 * --------------------------------------------------------------------------
1620 * Utility function to fill up information about the state of a port in a reply
1622 * Assumes that 'gOvsCtrlLock' lock is acquired.
1623 * --------------------------------------------------------------------------
1626 OvsPortFillInfo(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
1627 POVS_EVENT_ENTRY eventEntry,
1632 OVS_MESSAGE msgOutTmp;
1634 POVS_VPORT_ENTRY vport;
1636 ASSERT(NlBufAt(nlBuf, 0, 0) != 0 && nlBuf->bufRemLen >= sizeof msgOutTmp);
1638 msgOutTmp.nlMsg.nlmsgType = OVS_WIN_NL_VPORT_FAMILY_ID;
1639 msgOutTmp.nlMsg.nlmsgFlags = 0; /* XXX: ? */
1641 /* driver intiated messages should have zerp seq number*/
1642 msgOutTmp.nlMsg.nlmsgSeq = 0;
1643 msgOutTmp.nlMsg.nlmsgPid = usrParamsCtx->ovsInstance->pid;
1645 msgOutTmp.genlMsg.version = nlVportFamilyOps.version;
1646 msgOutTmp.genlMsg.reserved = 0;
1648 /* we don't have netdev yet, treat link up/down a adding/removing a port*/
1649 if (eventEntry->status & (OVS_EVENT_LINK_UP | OVS_EVENT_CONNECT)) {
1650 msgOutTmp.genlMsg.cmd = OVS_VPORT_CMD_NEW;
1651 } else if (eventEntry->status &
1652 (OVS_EVENT_LINK_DOWN | OVS_EVENT_DISCONNECT)) {
1653 msgOutTmp.genlMsg.cmd = OVS_VPORT_CMD_DEL;
1656 return STATUS_UNSUCCESSFUL;
1658 msgOutTmp.ovsHdr.dp_ifindex = gOvsSwitchContext->dpNo;
1660 rc = NlMsgPutHead(nlBuf, (PCHAR)&msgOutTmp, sizeof msgOutTmp);
1662 status = STATUS_INVALID_BUFFER_SIZE;
1666 vport = OvsFindVportByPortNo(gOvsSwitchContext, eventEntry->portNo);
1668 status = STATUS_DEVICE_DOES_NOT_EXIST;
1672 rc = NlMsgPutTailU32(nlBuf, OVS_VPORT_ATTR_PORT_NO, eventEntry->portNo) ||
1673 NlMsgPutTailU32(nlBuf, OVS_VPORT_ATTR_TYPE, vport->ovsType) ||
1674 NlMsgPutTailString(nlBuf, OVS_VPORT_ATTR_NAME, vport->ovsName);
1676 status = STATUS_INVALID_BUFFER_SIZE;
1680 /* XXXX Should we add the port stats attributes?*/
1681 nlMsg = (PNL_MSG_HDR)NlBufAt(nlBuf, 0, 0);
1682 nlMsg->nlmsgLen = NlBufSize(nlBuf);
1683 status = STATUS_SUCCESS;
1691 * --------------------------------------------------------------------------
1692 * Handler for reading events from the driver event queue. This handler is
1693 * executed when user mode issues a socket receive on a socket associated
1694 * with the MC group for events.
1695 * XXX: user mode should read multiple events in one system call.
1696 * --------------------------------------------------------------------------
/*
 * Removes one entry from the event queue of the calling instance and turns
 * it into a vport netlink message in the output buffer. '*replyLen' is set
 * to the number of bytes used in the buffer only when the message was built
 * successfully. The control lock is held from the switch context check until
 * just before the function ends.
 */
1699 OvsReadEventCmdHandler(POVS_USER_PARAMS_CONTEXT usrParamsCtx,
1703 POVS_MESSAGE msgOut = (POVS_MESSAGE)usrParamsCtx->outputBuffer;
1704 POVS_OPEN_INSTANCE instance =
1705 (POVS_OPEN_INSTANCE)usrParamsCtx->ovsInstance;
1709 OVS_EVENT_ENTRY eventEntry;
1711 ASSERT(usrParamsCtx->devOp == OVS_READ_DEV_OP);
1713 /* Should never read events with a dump socket */
1714 ASSERT(instance->dumpState.ovsMsg == NULL);
1716 /* Must have an event queue */
1717 ASSERT(instance->eventQueue != NULL);
1719 /* Output buffer has been validated while validating read dev op. */
1720 ASSERT(msgOut != NULL && usrParamsCtx->outputLength >= sizeof *msgOut);
1722 NlBufInit(&nlBuf, usrParamsCtx->outputBuffer, usrParamsCtx->outputLength);
1724 OvsAcquireCtrlLock();
/* Without a switch context there is nothing to report; success is returned.
 * Presumably control then skips to the lock release below -- confirm. */
1725 if (!gOvsSwitchContext) {
1726 status = STATUS_SUCCESS;
1730 /* remove an event entry from the event queue */
1731 status = OvsRemoveEventEntry(usrParamsCtx->ovsInstance, &eventEntry);
1732 if (status != STATUS_SUCCESS) {
/* NOTE(review): this result is compared against NDIS_STATUS_SUCCESS while
 * the check above uses STATUS_SUCCESS -- consider using one constant. */
1736 status = OvsPortFillInfo(usrParamsCtx, &eventEntry, &nlBuf);
1737 if (status == NDIS_STATUS_SUCCESS) {
1738 *replyLen = NlBufSize(&nlBuf);
1742 OvsReleaseCtrlLock();
1745 #endif /* OVS_USE_NL_INTERFACE */